Upload model.safetensors.index.json with huggingface_hub
Browse files- model.safetensors.index.json +991 -1
model.safetensors.index.json
CHANGED
|
@@ -87552,7 +87552,997 @@
|
|
| 87552 |
"model.layers.91.self_attn.v_proj.bias": "model-00092-of-00092.safetensors",
|
| 87553 |
"model.layers.91.self_attn.v_proj.weight": "model-00092-of-00092.safetensors",
|
| 87554 |
"model.layers.91.self_attn.v_proj.weight_scale": "model-00092-of-00092.safetensors",
|
| 87555 |
-
"model.norm.weight": "model-00092-of-00092.safetensors"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 87556 |
},
|
| 87557 |
"metadata": {
|
| 87558 |
"total_size": 241145664
|
|
|
|
| 87552 |
"model.layers.91.self_attn.v_proj.bias": "model-00092-of-00092.safetensors",
|
| 87553 |
"model.layers.91.self_attn.v_proj.weight": "model-00092-of-00092.safetensors",
|
| 87554 |
"model.layers.91.self_attn.v_proj.weight_scale": "model-00092-of-00092.safetensors",
|
| 87555 |
+
"model.norm.weight": "model-00092-of-00092.safetensors",
|
| 87556 |
+
"model.layers.92.embed_tokens.weight": "mtp.safetensors",
|
| 87557 |
+
"model.layers.92.shared_head.head.weight": "mtp.safetensors",
|
| 87558 |
+
"model.layers.92.shared_head.head.weight_scale": "mtp.safetensors",
|
| 87559 |
+
"model.layers.92.eh_proj.weight": "mtp.safetensors",
|
| 87560 |
+
"model.layers.92.enorm.weight": "mtp.safetensors",
|
| 87561 |
+
"model.layers.92.hnorm.weight": "mtp.safetensors",
|
| 87562 |
+
"model.layers.92.input_layernorm.weight": "mtp.safetensors",
|
| 87563 |
+
"model.layers.92.mlp.experts.0.down_proj.weight": "mtp.safetensors",
|
| 87564 |
+
"model.layers.92.mlp.experts.0.down_proj.weight_scale": "mtp.safetensors",
|
| 87565 |
+
"model.layers.92.mlp.experts.0.gate_proj.weight": "mtp.safetensors",
|
| 87566 |
+
"model.layers.92.mlp.experts.0.gate_proj.weight_scale": "mtp.safetensors",
|
| 87567 |
+
"model.layers.92.mlp.experts.0.up_proj.weight": "mtp.safetensors",
|
| 87568 |
+
"model.layers.92.mlp.experts.0.up_proj.weight_scale": "mtp.safetensors",
|
| 87569 |
+
"model.layers.92.mlp.experts.1.down_proj.weight": "mtp.safetensors",
|
| 87570 |
+
"model.layers.92.mlp.experts.1.down_proj.weight_scale": "mtp.safetensors",
|
| 87571 |
+
"model.layers.92.mlp.experts.1.gate_proj.weight": "mtp.safetensors",
|
| 87572 |
+
"model.layers.92.mlp.experts.1.gate_proj.weight_scale": "mtp.safetensors",
|
| 87573 |
+
"model.layers.92.mlp.experts.1.up_proj.weight": "mtp.safetensors",
|
| 87574 |
+
"model.layers.92.mlp.experts.1.up_proj.weight_scale": "mtp.safetensors",
|
| 87575 |
+
"model.layers.92.mlp.experts.10.down_proj.weight": "mtp.safetensors",
|
| 87576 |
+
"model.layers.92.mlp.experts.10.down_proj.weight_scale": "mtp.safetensors",
|
| 87577 |
+
"model.layers.92.mlp.experts.10.gate_proj.weight": "mtp.safetensors",
|
| 87578 |
+
"model.layers.92.mlp.experts.10.gate_proj.weight_scale": "mtp.safetensors",
|
| 87579 |
+
"model.layers.92.mlp.experts.10.up_proj.weight": "mtp.safetensors",
|
| 87580 |
+
"model.layers.92.mlp.experts.10.up_proj.weight_scale": "mtp.safetensors",
|
| 87581 |
+
"model.layers.92.mlp.experts.100.down_proj.weight": "mtp.safetensors",
|
| 87582 |
+
"model.layers.92.mlp.experts.100.down_proj.weight_scale": "mtp.safetensors",
|
| 87583 |
+
"model.layers.92.mlp.experts.100.gate_proj.weight": "mtp.safetensors",
|
| 87584 |
+
"model.layers.92.mlp.experts.100.gate_proj.weight_scale": "mtp.safetensors",
|
| 87585 |
+
"model.layers.92.mlp.experts.100.up_proj.weight": "mtp.safetensors",
|
| 87586 |
+
"model.layers.92.mlp.experts.100.up_proj.weight_scale": "mtp.safetensors",
|
| 87587 |
+
"model.layers.92.mlp.experts.101.down_proj.weight": "mtp.safetensors",
|
| 87588 |
+
"model.layers.92.mlp.experts.101.down_proj.weight_scale": "mtp.safetensors",
|
| 87589 |
+
"model.layers.92.mlp.experts.101.gate_proj.weight": "mtp.safetensors",
|
| 87590 |
+
"model.layers.92.mlp.experts.101.gate_proj.weight_scale": "mtp.safetensors",
|
| 87591 |
+
"model.layers.92.mlp.experts.101.up_proj.weight": "mtp.safetensors",
|
| 87592 |
+
"model.layers.92.mlp.experts.101.up_proj.weight_scale": "mtp.safetensors",
|
| 87593 |
+
"model.layers.92.mlp.experts.102.down_proj.weight": "mtp.safetensors",
|
| 87594 |
+
"model.layers.92.mlp.experts.102.down_proj.weight_scale": "mtp.safetensors",
|
| 87595 |
+
"model.layers.92.mlp.experts.102.gate_proj.weight": "mtp.safetensors",
|
| 87596 |
+
"model.layers.92.mlp.experts.102.gate_proj.weight_scale": "mtp.safetensors",
|
| 87597 |
+
"model.layers.92.mlp.experts.102.up_proj.weight": "mtp.safetensors",
|
| 87598 |
+
"model.layers.92.mlp.experts.102.up_proj.weight_scale": "mtp.safetensors",
|
| 87599 |
+
"model.layers.92.mlp.experts.103.down_proj.weight": "mtp.safetensors",
|
| 87600 |
+
"model.layers.92.mlp.experts.103.down_proj.weight_scale": "mtp.safetensors",
|
| 87601 |
+
"model.layers.92.mlp.experts.103.gate_proj.weight": "mtp.safetensors",
|
| 87602 |
+
"model.layers.92.mlp.experts.103.gate_proj.weight_scale": "mtp.safetensors",
|
| 87603 |
+
"model.layers.92.mlp.experts.103.up_proj.weight": "mtp.safetensors",
|
| 87604 |
+
"model.layers.92.mlp.experts.103.up_proj.weight_scale": "mtp.safetensors",
|
| 87605 |
+
"model.layers.92.mlp.experts.104.down_proj.weight": "mtp.safetensors",
|
| 87606 |
+
"model.layers.92.mlp.experts.104.down_proj.weight_scale": "mtp.safetensors",
|
| 87607 |
+
"model.layers.92.mlp.experts.104.gate_proj.weight": "mtp.safetensors",
|
| 87608 |
+
"model.layers.92.mlp.experts.104.gate_proj.weight_scale": "mtp.safetensors",
|
| 87609 |
+
"model.layers.92.mlp.experts.104.up_proj.weight": "mtp.safetensors",
|
| 87610 |
+
"model.layers.92.mlp.experts.104.up_proj.weight_scale": "mtp.safetensors",
|
| 87611 |
+
"model.layers.92.mlp.experts.105.down_proj.weight": "mtp.safetensors",
|
| 87612 |
+
"model.layers.92.mlp.experts.105.down_proj.weight_scale": "mtp.safetensors",
|
| 87613 |
+
"model.layers.92.mlp.experts.105.gate_proj.weight": "mtp.safetensors",
|
| 87614 |
+
"model.layers.92.mlp.experts.105.gate_proj.weight_scale": "mtp.safetensors",
|
| 87615 |
+
"model.layers.92.mlp.experts.105.up_proj.weight": "mtp.safetensors",
|
| 87616 |
+
"model.layers.92.mlp.experts.105.up_proj.weight_scale": "mtp.safetensors",
|
| 87617 |
+
"model.layers.92.mlp.experts.106.down_proj.weight": "mtp.safetensors",
|
| 87618 |
+
"model.layers.92.mlp.experts.106.down_proj.weight_scale": "mtp.safetensors",
|
| 87619 |
+
"model.layers.92.mlp.experts.106.gate_proj.weight": "mtp.safetensors",
|
| 87620 |
+
"model.layers.92.mlp.experts.106.gate_proj.weight_scale": "mtp.safetensors",
|
| 87621 |
+
"model.layers.92.mlp.experts.106.up_proj.weight": "mtp.safetensors",
|
| 87622 |
+
"model.layers.92.mlp.experts.106.up_proj.weight_scale": "mtp.safetensors",
|
| 87623 |
+
"model.layers.92.mlp.experts.107.down_proj.weight": "mtp.safetensors",
|
| 87624 |
+
"model.layers.92.mlp.experts.107.down_proj.weight_scale": "mtp.safetensors",
|
| 87625 |
+
"model.layers.92.mlp.experts.107.gate_proj.weight": "mtp.safetensors",
|
| 87626 |
+
"model.layers.92.mlp.experts.107.gate_proj.weight_scale": "mtp.safetensors",
|
| 87627 |
+
"model.layers.92.mlp.experts.107.up_proj.weight": "mtp.safetensors",
|
| 87628 |
+
"model.layers.92.mlp.experts.107.up_proj.weight_scale": "mtp.safetensors",
|
| 87629 |
+
"model.layers.92.mlp.experts.108.down_proj.weight": "mtp.safetensors",
|
| 87630 |
+
"model.layers.92.mlp.experts.108.down_proj.weight_scale": "mtp.safetensors",
|
| 87631 |
+
"model.layers.92.mlp.experts.108.gate_proj.weight": "mtp.safetensors",
|
| 87632 |
+
"model.layers.92.mlp.experts.108.gate_proj.weight_scale": "mtp.safetensors",
|
| 87633 |
+
"model.layers.92.mlp.experts.108.up_proj.weight": "mtp.safetensors",
|
| 87634 |
+
"model.layers.92.mlp.experts.108.up_proj.weight_scale": "mtp.safetensors",
|
| 87635 |
+
"model.layers.92.mlp.experts.109.down_proj.weight": "mtp.safetensors",
|
| 87636 |
+
"model.layers.92.mlp.experts.109.down_proj.weight_scale": "mtp.safetensors",
|
| 87637 |
+
"model.layers.92.mlp.experts.109.gate_proj.weight": "mtp.safetensors",
|
| 87638 |
+
"model.layers.92.mlp.experts.109.gate_proj.weight_scale": "mtp.safetensors",
|
| 87639 |
+
"model.layers.92.mlp.experts.109.up_proj.weight": "mtp.safetensors",
|
| 87640 |
+
"model.layers.92.mlp.experts.109.up_proj.weight_scale": "mtp.safetensors",
|
| 87641 |
+
"model.layers.92.mlp.experts.11.down_proj.weight": "mtp.safetensors",
|
| 87642 |
+
"model.layers.92.mlp.experts.11.down_proj.weight_scale": "mtp.safetensors",
|
| 87643 |
+
"model.layers.92.mlp.experts.11.gate_proj.weight": "mtp.safetensors",
|
| 87644 |
+
"model.layers.92.mlp.experts.11.gate_proj.weight_scale": "mtp.safetensors",
|
| 87645 |
+
"model.layers.92.mlp.experts.11.up_proj.weight": "mtp.safetensors",
|
| 87646 |
+
"model.layers.92.mlp.experts.11.up_proj.weight_scale": "mtp.safetensors",
|
| 87647 |
+
"model.layers.92.mlp.experts.110.down_proj.weight": "mtp.safetensors",
|
| 87648 |
+
"model.layers.92.mlp.experts.110.down_proj.weight_scale": "mtp.safetensors",
|
| 87649 |
+
"model.layers.92.mlp.experts.110.gate_proj.weight": "mtp.safetensors",
|
| 87650 |
+
"model.layers.92.mlp.experts.110.gate_proj.weight_scale": "mtp.safetensors",
|
| 87651 |
+
"model.layers.92.mlp.experts.110.up_proj.weight": "mtp.safetensors",
|
| 87652 |
+
"model.layers.92.mlp.experts.110.up_proj.weight_scale": "mtp.safetensors",
|
| 87653 |
+
"model.layers.92.mlp.experts.111.down_proj.weight": "mtp.safetensors",
|
| 87654 |
+
"model.layers.92.mlp.experts.111.down_proj.weight_scale": "mtp.safetensors",
|
| 87655 |
+
"model.layers.92.mlp.experts.111.gate_proj.weight": "mtp.safetensors",
|
| 87656 |
+
"model.layers.92.mlp.experts.111.gate_proj.weight_scale": "mtp.safetensors",
|
| 87657 |
+
"model.layers.92.mlp.experts.111.up_proj.weight": "mtp.safetensors",
|
| 87658 |
+
"model.layers.92.mlp.experts.111.up_proj.weight_scale": "mtp.safetensors",
|
| 87659 |
+
"model.layers.92.mlp.experts.112.down_proj.weight": "mtp.safetensors",
|
| 87660 |
+
"model.layers.92.mlp.experts.112.down_proj.weight_scale": "mtp.safetensors",
|
| 87661 |
+
"model.layers.92.mlp.experts.112.gate_proj.weight": "mtp.safetensors",
|
| 87662 |
+
"model.layers.92.mlp.experts.112.gate_proj.weight_scale": "mtp.safetensors",
|
| 87663 |
+
"model.layers.92.mlp.experts.112.up_proj.weight": "mtp.safetensors",
|
| 87664 |
+
"model.layers.92.mlp.experts.112.up_proj.weight_scale": "mtp.safetensors",
|
| 87665 |
+
"model.layers.92.mlp.experts.113.down_proj.weight": "mtp.safetensors",
|
| 87666 |
+
"model.layers.92.mlp.experts.113.down_proj.weight_scale": "mtp.safetensors",
|
| 87667 |
+
"model.layers.92.mlp.experts.113.gate_proj.weight": "mtp.safetensors",
|
| 87668 |
+
"model.layers.92.mlp.experts.113.gate_proj.weight_scale": "mtp.safetensors",
|
| 87669 |
+
"model.layers.92.mlp.experts.113.up_proj.weight": "mtp.safetensors",
|
| 87670 |
+
"model.layers.92.mlp.experts.113.up_proj.weight_scale": "mtp.safetensors",
|
| 87671 |
+
"model.layers.92.mlp.experts.114.down_proj.weight": "mtp.safetensors",
|
| 87672 |
+
"model.layers.92.mlp.experts.114.down_proj.weight_scale": "mtp.safetensors",
|
| 87673 |
+
"model.layers.92.mlp.experts.114.gate_proj.weight": "mtp.safetensors",
|
| 87674 |
+
"model.layers.92.mlp.experts.114.gate_proj.weight_scale": "mtp.safetensors",
|
| 87675 |
+
"model.layers.92.mlp.experts.114.up_proj.weight": "mtp.safetensors",
|
| 87676 |
+
"model.layers.92.mlp.experts.114.up_proj.weight_scale": "mtp.safetensors",
|
| 87677 |
+
"model.layers.92.mlp.experts.115.down_proj.weight": "mtp.safetensors",
|
| 87678 |
+
"model.layers.92.mlp.experts.115.down_proj.weight_scale": "mtp.safetensors",
|
| 87679 |
+
"model.layers.92.mlp.experts.115.gate_proj.weight": "mtp.safetensors",
|
| 87680 |
+
"model.layers.92.mlp.experts.115.gate_proj.weight_scale": "mtp.safetensors",
|
| 87681 |
+
"model.layers.92.mlp.experts.115.up_proj.weight": "mtp.safetensors",
|
| 87682 |
+
"model.layers.92.mlp.experts.115.up_proj.weight_scale": "mtp.safetensors",
|
| 87683 |
+
"model.layers.92.mlp.experts.116.down_proj.weight": "mtp.safetensors",
|
| 87684 |
+
"model.layers.92.mlp.experts.116.down_proj.weight_scale": "mtp.safetensors",
|
| 87685 |
+
"model.layers.92.mlp.experts.116.gate_proj.weight": "mtp.safetensors",
|
| 87686 |
+
"model.layers.92.mlp.experts.116.gate_proj.weight_scale": "mtp.safetensors",
|
| 87687 |
+
"model.layers.92.mlp.experts.116.up_proj.weight": "mtp.safetensors",
|
| 87688 |
+
"model.layers.92.mlp.experts.116.up_proj.weight_scale": "mtp.safetensors",
|
| 87689 |
+
"model.layers.92.mlp.experts.117.down_proj.weight": "mtp.safetensors",
|
| 87690 |
+
"model.layers.92.mlp.experts.117.down_proj.weight_scale": "mtp.safetensors",
|
| 87691 |
+
"model.layers.92.mlp.experts.117.gate_proj.weight": "mtp.safetensors",
|
| 87692 |
+
"model.layers.92.mlp.experts.117.gate_proj.weight_scale": "mtp.safetensors",
|
| 87693 |
+
"model.layers.92.mlp.experts.117.up_proj.weight": "mtp.safetensors",
|
| 87694 |
+
"model.layers.92.mlp.experts.117.up_proj.weight_scale": "mtp.safetensors",
|
| 87695 |
+
"model.layers.92.mlp.experts.118.down_proj.weight": "mtp.safetensors",
|
| 87696 |
+
"model.layers.92.mlp.experts.118.down_proj.weight_scale": "mtp.safetensors",
|
| 87697 |
+
"model.layers.92.mlp.experts.118.gate_proj.weight": "mtp.safetensors",
|
| 87698 |
+
"model.layers.92.mlp.experts.118.gate_proj.weight_scale": "mtp.safetensors",
|
| 87699 |
+
"model.layers.92.mlp.experts.118.up_proj.weight": "mtp.safetensors",
|
| 87700 |
+
"model.layers.92.mlp.experts.118.up_proj.weight_scale": "mtp.safetensors",
|
| 87701 |
+
"model.layers.92.mlp.experts.119.down_proj.weight": "mtp.safetensors",
|
| 87702 |
+
"model.layers.92.mlp.experts.119.down_proj.weight_scale": "mtp.safetensors",
|
| 87703 |
+
"model.layers.92.mlp.experts.119.gate_proj.weight": "mtp.safetensors",
|
| 87704 |
+
"model.layers.92.mlp.experts.119.gate_proj.weight_scale": "mtp.safetensors",
|
| 87705 |
+
"model.layers.92.mlp.experts.119.up_proj.weight": "mtp.safetensors",
|
| 87706 |
+
"model.layers.92.mlp.experts.119.up_proj.weight_scale": "mtp.safetensors",
|
| 87707 |
+
"model.layers.92.mlp.experts.12.down_proj.weight": "mtp.safetensors",
|
| 87708 |
+
"model.layers.92.mlp.experts.12.down_proj.weight_scale": "mtp.safetensors",
|
| 87709 |
+
"model.layers.92.mlp.experts.12.gate_proj.weight": "mtp.safetensors",
|
| 87710 |
+
"model.layers.92.mlp.experts.12.gate_proj.weight_scale": "mtp.safetensors",
|
| 87711 |
+
"model.layers.92.mlp.experts.12.up_proj.weight": "mtp.safetensors",
|
| 87712 |
+
"model.layers.92.mlp.experts.12.up_proj.weight_scale": "mtp.safetensors",
|
| 87713 |
+
"model.layers.92.mlp.experts.120.down_proj.weight": "mtp.safetensors",
|
| 87714 |
+
"model.layers.92.mlp.experts.120.down_proj.weight_scale": "mtp.safetensors",
|
| 87715 |
+
"model.layers.92.mlp.experts.120.gate_proj.weight": "mtp.safetensors",
|
| 87716 |
+
"model.layers.92.mlp.experts.120.gate_proj.weight_scale": "mtp.safetensors",
|
| 87717 |
+
"model.layers.92.mlp.experts.120.up_proj.weight": "mtp.safetensors",
|
| 87718 |
+
"model.layers.92.mlp.experts.120.up_proj.weight_scale": "mtp.safetensors",
|
| 87719 |
+
"model.layers.92.mlp.experts.121.down_proj.weight": "mtp.safetensors",
|
| 87720 |
+
"model.layers.92.mlp.experts.121.down_proj.weight_scale": "mtp.safetensors",
|
| 87721 |
+
"model.layers.92.mlp.experts.121.gate_proj.weight": "mtp.safetensors",
|
| 87722 |
+
"model.layers.92.mlp.experts.121.gate_proj.weight_scale": "mtp.safetensors",
|
| 87723 |
+
"model.layers.92.mlp.experts.121.up_proj.weight": "mtp.safetensors",
|
| 87724 |
+
"model.layers.92.mlp.experts.121.up_proj.weight_scale": "mtp.safetensors",
|
| 87725 |
+
"model.layers.92.mlp.experts.122.down_proj.weight": "mtp.safetensors",
|
| 87726 |
+
"model.layers.92.mlp.experts.122.down_proj.weight_scale": "mtp.safetensors",
|
| 87727 |
+
"model.layers.92.mlp.experts.122.gate_proj.weight": "mtp.safetensors",
|
| 87728 |
+
"model.layers.92.mlp.experts.122.gate_proj.weight_scale": "mtp.safetensors",
|
| 87729 |
+
"model.layers.92.mlp.experts.122.up_proj.weight": "mtp.safetensors",
|
| 87730 |
+
"model.layers.92.mlp.experts.122.up_proj.weight_scale": "mtp.safetensors",
|
| 87731 |
+
"model.layers.92.mlp.experts.123.down_proj.weight": "mtp.safetensors",
|
| 87732 |
+
"model.layers.92.mlp.experts.123.down_proj.weight_scale": "mtp.safetensors",
|
| 87733 |
+
"model.layers.92.mlp.experts.123.gate_proj.weight": "mtp.safetensors",
|
| 87734 |
+
"model.layers.92.mlp.experts.123.gate_proj.weight_scale": "mtp.safetensors",
|
| 87735 |
+
"model.layers.92.mlp.experts.123.up_proj.weight": "mtp.safetensors",
|
| 87736 |
+
"model.layers.92.mlp.experts.123.up_proj.weight_scale": "mtp.safetensors",
|
| 87737 |
+
"model.layers.92.mlp.experts.124.down_proj.weight": "mtp.safetensors",
|
| 87738 |
+
"model.layers.92.mlp.experts.124.down_proj.weight_scale": "mtp.safetensors",
|
| 87739 |
+
"model.layers.92.mlp.experts.124.gate_proj.weight": "mtp.safetensors",
|
| 87740 |
+
"model.layers.92.mlp.experts.124.gate_proj.weight_scale": "mtp.safetensors",
|
| 87741 |
+
"model.layers.92.mlp.experts.124.up_proj.weight": "mtp.safetensors",
|
| 87742 |
+
"model.layers.92.mlp.experts.124.up_proj.weight_scale": "mtp.safetensors",
|
| 87743 |
+
"model.layers.92.mlp.experts.125.down_proj.weight": "mtp.safetensors",
|
| 87744 |
+
"model.layers.92.mlp.experts.125.down_proj.weight_scale": "mtp.safetensors",
|
| 87745 |
+
"model.layers.92.mlp.experts.125.gate_proj.weight": "mtp.safetensors",
|
| 87746 |
+
"model.layers.92.mlp.experts.125.gate_proj.weight_scale": "mtp.safetensors",
|
| 87747 |
+
"model.layers.92.mlp.experts.125.up_proj.weight": "mtp.safetensors",
|
| 87748 |
+
"model.layers.92.mlp.experts.125.up_proj.weight_scale": "mtp.safetensors",
|
| 87749 |
+
"model.layers.92.mlp.experts.126.down_proj.weight": "mtp.safetensors",
|
| 87750 |
+
"model.layers.92.mlp.experts.126.down_proj.weight_scale": "mtp.safetensors",
|
| 87751 |
+
"model.layers.92.mlp.experts.126.gate_proj.weight": "mtp.safetensors",
|
| 87752 |
+
"model.layers.92.mlp.experts.126.gate_proj.weight_scale": "mtp.safetensors",
|
| 87753 |
+
"model.layers.92.mlp.experts.126.up_proj.weight": "mtp.safetensors",
|
| 87754 |
+
"model.layers.92.mlp.experts.126.up_proj.weight_scale": "mtp.safetensors",
|
| 87755 |
+
"model.layers.92.mlp.experts.127.down_proj.weight": "mtp.safetensors",
|
| 87756 |
+
"model.layers.92.mlp.experts.127.down_proj.weight_scale": "mtp.safetensors",
|
| 87757 |
+
"model.layers.92.mlp.experts.127.gate_proj.weight": "mtp.safetensors",
|
| 87758 |
+
"model.layers.92.mlp.experts.127.gate_proj.weight_scale": "mtp.safetensors",
|
| 87759 |
+
"model.layers.92.mlp.experts.127.up_proj.weight": "mtp.safetensors",
|
| 87760 |
+
"model.layers.92.mlp.experts.127.up_proj.weight_scale": "mtp.safetensors",
|
| 87761 |
+
"model.layers.92.mlp.experts.128.down_proj.weight": "mtp.safetensors",
|
| 87762 |
+
"model.layers.92.mlp.experts.128.down_proj.weight_scale": "mtp.safetensors",
|
| 87763 |
+
"model.layers.92.mlp.experts.128.gate_proj.weight": "mtp.safetensors",
|
| 87764 |
+
"model.layers.92.mlp.experts.128.gate_proj.weight_scale": "mtp.safetensors",
|
| 87765 |
+
"model.layers.92.mlp.experts.128.up_proj.weight": "mtp.safetensors",
|
| 87766 |
+
"model.layers.92.mlp.experts.128.up_proj.weight_scale": "mtp.safetensors",
|
| 87767 |
+
"model.layers.92.mlp.experts.129.down_proj.weight": "mtp.safetensors",
|
| 87768 |
+
"model.layers.92.mlp.experts.129.down_proj.weight_scale": "mtp.safetensors",
|
| 87769 |
+
"model.layers.92.mlp.experts.129.gate_proj.weight": "mtp.safetensors",
|
| 87770 |
+
"model.layers.92.mlp.experts.129.gate_proj.weight_scale": "mtp.safetensors",
|
| 87771 |
+
"model.layers.92.mlp.experts.129.up_proj.weight": "mtp.safetensors",
|
| 87772 |
+
"model.layers.92.mlp.experts.129.up_proj.weight_scale": "mtp.safetensors",
|
| 87773 |
+
"model.layers.92.mlp.experts.13.down_proj.weight": "mtp.safetensors",
|
| 87774 |
+
"model.layers.92.mlp.experts.13.down_proj.weight_scale": "mtp.safetensors",
|
| 87775 |
+
"model.layers.92.mlp.experts.13.gate_proj.weight": "mtp.safetensors",
|
| 87776 |
+
"model.layers.92.mlp.experts.13.gate_proj.weight_scale": "mtp.safetensors",
|
| 87777 |
+
"model.layers.92.mlp.experts.13.up_proj.weight": "mtp.safetensors",
|
| 87778 |
+
"model.layers.92.mlp.experts.13.up_proj.weight_scale": "mtp.safetensors",
|
| 87779 |
+
"model.layers.92.mlp.experts.130.down_proj.weight": "mtp.safetensors",
|
| 87780 |
+
"model.layers.92.mlp.experts.130.down_proj.weight_scale": "mtp.safetensors",
|
| 87781 |
+
"model.layers.92.mlp.experts.130.gate_proj.weight": "mtp.safetensors",
|
| 87782 |
+
"model.layers.92.mlp.experts.130.gate_proj.weight_scale": "mtp.safetensors",
|
| 87783 |
+
"model.layers.92.mlp.experts.130.up_proj.weight": "mtp.safetensors",
|
| 87784 |
+
"model.layers.92.mlp.experts.130.up_proj.weight_scale": "mtp.safetensors",
|
| 87785 |
+
"model.layers.92.mlp.experts.131.down_proj.weight": "mtp.safetensors",
|
| 87786 |
+
"model.layers.92.mlp.experts.131.down_proj.weight_scale": "mtp.safetensors",
|
| 87787 |
+
"model.layers.92.mlp.experts.131.gate_proj.weight": "mtp.safetensors",
|
| 87788 |
+
"model.layers.92.mlp.experts.131.gate_proj.weight_scale": "mtp.safetensors",
|
| 87789 |
+
"model.layers.92.mlp.experts.131.up_proj.weight": "mtp.safetensors",
|
| 87790 |
+
"model.layers.92.mlp.experts.131.up_proj.weight_scale": "mtp.safetensors",
|
| 87791 |
+
"model.layers.92.mlp.experts.132.down_proj.weight": "mtp.safetensors",
|
| 87792 |
+
"model.layers.92.mlp.experts.132.down_proj.weight_scale": "mtp.safetensors",
|
| 87793 |
+
"model.layers.92.mlp.experts.132.gate_proj.weight": "mtp.safetensors",
|
| 87794 |
+
"model.layers.92.mlp.experts.132.gate_proj.weight_scale": "mtp.safetensors",
|
| 87795 |
+
"model.layers.92.mlp.experts.132.up_proj.weight": "mtp.safetensors",
|
| 87796 |
+
"model.layers.92.mlp.experts.132.up_proj.weight_scale": "mtp.safetensors",
|
| 87797 |
+
"model.layers.92.mlp.experts.133.down_proj.weight": "mtp.safetensors",
|
| 87798 |
+
"model.layers.92.mlp.experts.133.down_proj.weight_scale": "mtp.safetensors",
|
| 87799 |
+
"model.layers.92.mlp.experts.133.gate_proj.weight": "mtp.safetensors",
|
| 87800 |
+
"model.layers.92.mlp.experts.133.gate_proj.weight_scale": "mtp.safetensors",
|
| 87801 |
+
"model.layers.92.mlp.experts.133.up_proj.weight": "mtp.safetensors",
|
| 87802 |
+
"model.layers.92.mlp.experts.133.up_proj.weight_scale": "mtp.safetensors",
|
| 87803 |
+
"model.layers.92.mlp.experts.134.down_proj.weight": "mtp.safetensors",
|
| 87804 |
+
"model.layers.92.mlp.experts.134.down_proj.weight_scale": "mtp.safetensors",
|
| 87805 |
+
"model.layers.92.mlp.experts.134.gate_proj.weight": "mtp.safetensors",
|
| 87806 |
+
"model.layers.92.mlp.experts.134.gate_proj.weight_scale": "mtp.safetensors",
|
| 87807 |
+
"model.layers.92.mlp.experts.134.up_proj.weight": "mtp.safetensors",
|
| 87808 |
+
"model.layers.92.mlp.experts.134.up_proj.weight_scale": "mtp.safetensors",
|
| 87809 |
+
"model.layers.92.mlp.experts.135.down_proj.weight": "mtp.safetensors",
|
| 87810 |
+
"model.layers.92.mlp.experts.135.down_proj.weight_scale": "mtp.safetensors",
|
| 87811 |
+
"model.layers.92.mlp.experts.135.gate_proj.weight": "mtp.safetensors",
|
| 87812 |
+
"model.layers.92.mlp.experts.135.gate_proj.weight_scale": "mtp.safetensors",
|
| 87813 |
+
"model.layers.92.mlp.experts.135.up_proj.weight": "mtp.safetensors",
|
| 87814 |
+
"model.layers.92.mlp.experts.135.up_proj.weight_scale": "mtp.safetensors",
|
| 87815 |
+
"model.layers.92.mlp.experts.136.down_proj.weight": "mtp.safetensors",
|
| 87816 |
+
"model.layers.92.mlp.experts.136.down_proj.weight_scale": "mtp.safetensors",
|
| 87817 |
+
"model.layers.92.mlp.experts.136.gate_proj.weight": "mtp.safetensors",
|
| 87818 |
+
"model.layers.92.mlp.experts.136.gate_proj.weight_scale": "mtp.safetensors",
|
| 87819 |
+
"model.layers.92.mlp.experts.136.up_proj.weight": "mtp.safetensors",
|
| 87820 |
+
"model.layers.92.mlp.experts.136.up_proj.weight_scale": "mtp.safetensors",
|
| 87821 |
+
"model.layers.92.mlp.experts.137.down_proj.weight": "mtp.safetensors",
|
| 87822 |
+
"model.layers.92.mlp.experts.137.down_proj.weight_scale": "mtp.safetensors",
|
| 87823 |
+
"model.layers.92.mlp.experts.137.gate_proj.weight": "mtp.safetensors",
|
| 87824 |
+
"model.layers.92.mlp.experts.137.gate_proj.weight_scale": "mtp.safetensors",
|
| 87825 |
+
"model.layers.92.mlp.experts.137.up_proj.weight": "mtp.safetensors",
|
| 87826 |
+
"model.layers.92.mlp.experts.137.up_proj.weight_scale": "mtp.safetensors",
|
| 87827 |
+
"model.layers.92.mlp.experts.138.down_proj.weight": "mtp.safetensors",
|
| 87828 |
+
"model.layers.92.mlp.experts.138.down_proj.weight_scale": "mtp.safetensors",
|
| 87829 |
+
"model.layers.92.mlp.experts.138.gate_proj.weight": "mtp.safetensors",
|
| 87830 |
+
"model.layers.92.mlp.experts.138.gate_proj.weight_scale": "mtp.safetensors",
|
| 87831 |
+
"model.layers.92.mlp.experts.138.up_proj.weight": "mtp.safetensors",
|
| 87832 |
+
"model.layers.92.mlp.experts.138.up_proj.weight_scale": "mtp.safetensors",
|
| 87833 |
+
"model.layers.92.mlp.experts.139.down_proj.weight": "mtp.safetensors",
|
| 87834 |
+
"model.layers.92.mlp.experts.139.down_proj.weight_scale": "mtp.safetensors",
|
| 87835 |
+
"model.layers.92.mlp.experts.139.gate_proj.weight": "mtp.safetensors",
|
| 87836 |
+
"model.layers.92.mlp.experts.139.gate_proj.weight_scale": "mtp.safetensors",
|
| 87837 |
+
"model.layers.92.mlp.experts.139.up_proj.weight": "mtp.safetensors",
|
| 87838 |
+
"model.layers.92.mlp.experts.139.up_proj.weight_scale": "mtp.safetensors",
|
| 87839 |
+
"model.layers.92.mlp.experts.14.down_proj.weight": "mtp.safetensors",
|
| 87840 |
+
"model.layers.92.mlp.experts.14.down_proj.weight_scale": "mtp.safetensors",
|
| 87841 |
+
"model.layers.92.mlp.experts.14.gate_proj.weight": "mtp.safetensors",
|
| 87842 |
+
"model.layers.92.mlp.experts.14.gate_proj.weight_scale": "mtp.safetensors",
|
| 87843 |
+
"model.layers.92.mlp.experts.14.up_proj.weight": "mtp.safetensors",
|
| 87844 |
+
"model.layers.92.mlp.experts.14.up_proj.weight_scale": "mtp.safetensors",
|
| 87845 |
+
"model.layers.92.mlp.experts.140.down_proj.weight": "mtp.safetensors",
|
| 87846 |
+
"model.layers.92.mlp.experts.140.down_proj.weight_scale": "mtp.safetensors",
|
| 87847 |
+
"model.layers.92.mlp.experts.140.gate_proj.weight": "mtp.safetensors",
|
| 87848 |
+
"model.layers.92.mlp.experts.140.gate_proj.weight_scale": "mtp.safetensors",
|
| 87849 |
+
"model.layers.92.mlp.experts.140.up_proj.weight": "mtp.safetensors",
|
| 87850 |
+
"model.layers.92.mlp.experts.140.up_proj.weight_scale": "mtp.safetensors",
|
| 87851 |
+
"model.layers.92.mlp.experts.141.down_proj.weight": "mtp.safetensors",
|
| 87852 |
+
"model.layers.92.mlp.experts.141.down_proj.weight_scale": "mtp.safetensors",
|
| 87853 |
+
"model.layers.92.mlp.experts.141.gate_proj.weight": "mtp.safetensors",
|
| 87854 |
+
"model.layers.92.mlp.experts.141.gate_proj.weight_scale": "mtp.safetensors",
|
| 87855 |
+
"model.layers.92.mlp.experts.141.up_proj.weight": "mtp.safetensors",
|
| 87856 |
+
"model.layers.92.mlp.experts.141.up_proj.weight_scale": "mtp.safetensors",
|
| 87857 |
+
"model.layers.92.mlp.experts.142.down_proj.weight": "mtp.safetensors",
|
| 87858 |
+
"model.layers.92.mlp.experts.142.down_proj.weight_scale": "mtp.safetensors",
|
| 87859 |
+
"model.layers.92.mlp.experts.142.gate_proj.weight": "mtp.safetensors",
|
| 87860 |
+
"model.layers.92.mlp.experts.142.gate_proj.weight_scale": "mtp.safetensors",
|
| 87861 |
+
"model.layers.92.mlp.experts.142.up_proj.weight": "mtp.safetensors",
|
| 87862 |
+
"model.layers.92.mlp.experts.142.up_proj.weight_scale": "mtp.safetensors",
|
| 87863 |
+
"model.layers.92.mlp.experts.143.down_proj.weight": "mtp.safetensors",
|
| 87864 |
+
"model.layers.92.mlp.experts.143.down_proj.weight_scale": "mtp.safetensors",
|
| 87865 |
+
"model.layers.92.mlp.experts.143.gate_proj.weight": "mtp.safetensors",
|
| 87866 |
+
"model.layers.92.mlp.experts.143.gate_proj.weight_scale": "mtp.safetensors",
|
| 87867 |
+
"model.layers.92.mlp.experts.143.up_proj.weight": "mtp.safetensors",
|
| 87868 |
+
"model.layers.92.mlp.experts.143.up_proj.weight_scale": "mtp.safetensors",
|
| 87869 |
+
"model.layers.92.mlp.experts.144.down_proj.weight": "mtp.safetensors",
|
| 87870 |
+
"model.layers.92.mlp.experts.144.down_proj.weight_scale": "mtp.safetensors",
|
| 87871 |
+
"model.layers.92.mlp.experts.144.gate_proj.weight": "mtp.safetensors",
|
| 87872 |
+
"model.layers.92.mlp.experts.144.gate_proj.weight_scale": "mtp.safetensors",
|
| 87873 |
+
"model.layers.92.mlp.experts.144.up_proj.weight": "mtp.safetensors",
|
| 87874 |
+
"model.layers.92.mlp.experts.144.up_proj.weight_scale": "mtp.safetensors",
|
| 87875 |
+
"model.layers.92.mlp.experts.145.down_proj.weight": "mtp.safetensors",
|
| 87876 |
+
"model.layers.92.mlp.experts.145.down_proj.weight_scale": "mtp.safetensors",
|
| 87877 |
+
"model.layers.92.mlp.experts.145.gate_proj.weight": "mtp.safetensors",
|
| 87878 |
+
"model.layers.92.mlp.experts.145.gate_proj.weight_scale": "mtp.safetensors",
|
| 87879 |
+
"model.layers.92.mlp.experts.145.up_proj.weight": "mtp.safetensors",
|
| 87880 |
+
"model.layers.92.mlp.experts.145.up_proj.weight_scale": "mtp.safetensors",
|
| 87881 |
+
"model.layers.92.mlp.experts.146.down_proj.weight": "mtp.safetensors",
|
| 87882 |
+
"model.layers.92.mlp.experts.146.down_proj.weight_scale": "mtp.safetensors",
|
| 87883 |
+
"model.layers.92.mlp.experts.146.gate_proj.weight": "mtp.safetensors",
|
| 87884 |
+
"model.layers.92.mlp.experts.146.gate_proj.weight_scale": "mtp.safetensors",
|
| 87885 |
+
"model.layers.92.mlp.experts.146.up_proj.weight": "mtp.safetensors",
|
| 87886 |
+
"model.layers.92.mlp.experts.146.up_proj.weight_scale": "mtp.safetensors",
|
| 87887 |
+
"model.layers.92.mlp.experts.147.down_proj.weight": "mtp.safetensors",
|
| 87888 |
+
"model.layers.92.mlp.experts.147.down_proj.weight_scale": "mtp.safetensors",
|
| 87889 |
+
"model.layers.92.mlp.experts.147.gate_proj.weight": "mtp.safetensors",
|
| 87890 |
+
"model.layers.92.mlp.experts.147.gate_proj.weight_scale": "mtp.safetensors",
|
| 87891 |
+
"model.layers.92.mlp.experts.147.up_proj.weight": "mtp.safetensors",
|
| 87892 |
+
"model.layers.92.mlp.experts.147.up_proj.weight_scale": "mtp.safetensors",
|
| 87893 |
+
"model.layers.92.mlp.experts.148.down_proj.weight": "mtp.safetensors",
|
| 87894 |
+
"model.layers.92.mlp.experts.148.down_proj.weight_scale": "mtp.safetensors",
|
| 87895 |
+
"model.layers.92.mlp.experts.148.gate_proj.weight": "mtp.safetensors",
|
| 87896 |
+
"model.layers.92.mlp.experts.148.gate_proj.weight_scale": "mtp.safetensors",
|
| 87897 |
+
"model.layers.92.mlp.experts.148.up_proj.weight": "mtp.safetensors",
|
| 87898 |
+
"model.layers.92.mlp.experts.148.up_proj.weight_scale": "mtp.safetensors",
|
| 87899 |
+
"model.layers.92.mlp.experts.149.down_proj.weight": "mtp.safetensors",
|
| 87900 |
+
"model.layers.92.mlp.experts.149.down_proj.weight_scale": "mtp.safetensors",
|
| 87901 |
+
"model.layers.92.mlp.experts.149.gate_proj.weight": "mtp.safetensors",
|
| 87902 |
+
"model.layers.92.mlp.experts.149.gate_proj.weight_scale": "mtp.safetensors",
|
| 87903 |
+
"model.layers.92.mlp.experts.149.up_proj.weight": "mtp.safetensors",
|
| 87904 |
+
"model.layers.92.mlp.experts.149.up_proj.weight_scale": "mtp.safetensors",
|
| 87905 |
+
"model.layers.92.mlp.experts.15.down_proj.weight": "mtp.safetensors",
|
| 87906 |
+
"model.layers.92.mlp.experts.15.down_proj.weight_scale": "mtp.safetensors",
|
| 87907 |
+
"model.layers.92.mlp.experts.15.gate_proj.weight": "mtp.safetensors",
|
| 87908 |
+
"model.layers.92.mlp.experts.15.gate_proj.weight_scale": "mtp.safetensors",
|
| 87909 |
+
"model.layers.92.mlp.experts.15.up_proj.weight": "mtp.safetensors",
|
| 87910 |
+
"model.layers.92.mlp.experts.15.up_proj.weight_scale": "mtp.safetensors",
|
| 87911 |
+
"model.layers.92.mlp.experts.150.down_proj.weight": "mtp.safetensors",
|
| 87912 |
+
"model.layers.92.mlp.experts.150.down_proj.weight_scale": "mtp.safetensors",
|
| 87913 |
+
"model.layers.92.mlp.experts.150.gate_proj.weight": "mtp.safetensors",
|
| 87914 |
+
"model.layers.92.mlp.experts.150.gate_proj.weight_scale": "mtp.safetensors",
|
| 87915 |
+
"model.layers.92.mlp.experts.150.up_proj.weight": "mtp.safetensors",
|
| 87916 |
+
"model.layers.92.mlp.experts.150.up_proj.weight_scale": "mtp.safetensors",
|
| 87917 |
+
"model.layers.92.mlp.experts.151.down_proj.weight": "mtp.safetensors",
|
| 87918 |
+
"model.layers.92.mlp.experts.151.down_proj.weight_scale": "mtp.safetensors",
|
| 87919 |
+
"model.layers.92.mlp.experts.151.gate_proj.weight": "mtp.safetensors",
|
| 87920 |
+
"model.layers.92.mlp.experts.151.gate_proj.weight_scale": "mtp.safetensors",
|
| 87921 |
+
"model.layers.92.mlp.experts.151.up_proj.weight": "mtp.safetensors",
|
| 87922 |
+
"model.layers.92.mlp.experts.151.up_proj.weight_scale": "mtp.safetensors",
|
| 87923 |
+
"model.layers.92.mlp.experts.152.down_proj.weight": "mtp.safetensors",
|
| 87924 |
+
"model.layers.92.mlp.experts.152.down_proj.weight_scale": "mtp.safetensors",
|
| 87925 |
+
"model.layers.92.mlp.experts.152.gate_proj.weight": "mtp.safetensors",
|
| 87926 |
+
"model.layers.92.mlp.experts.152.gate_proj.weight_scale": "mtp.safetensors",
|
| 87927 |
+
"model.layers.92.mlp.experts.152.up_proj.weight": "mtp.safetensors",
|
| 87928 |
+
"model.layers.92.mlp.experts.152.up_proj.weight_scale": "mtp.safetensors",
|
| 87929 |
+
"model.layers.92.mlp.experts.153.down_proj.weight": "mtp.safetensors",
|
| 87930 |
+
"model.layers.92.mlp.experts.153.down_proj.weight_scale": "mtp.safetensors",
|
| 87931 |
+
"model.layers.92.mlp.experts.153.gate_proj.weight": "mtp.safetensors",
|
| 87932 |
+
"model.layers.92.mlp.experts.153.gate_proj.weight_scale": "mtp.safetensors",
|
| 87933 |
+
"model.layers.92.mlp.experts.153.up_proj.weight": "mtp.safetensors",
|
| 87934 |
+
"model.layers.92.mlp.experts.153.up_proj.weight_scale": "mtp.safetensors",
|
| 87935 |
+
"model.layers.92.mlp.experts.154.down_proj.weight": "mtp.safetensors",
|
| 87936 |
+
"model.layers.92.mlp.experts.154.down_proj.weight_scale": "mtp.safetensors",
|
| 87937 |
+
"model.layers.92.mlp.experts.154.gate_proj.weight": "mtp.safetensors",
|
| 87938 |
+
"model.layers.92.mlp.experts.154.gate_proj.weight_scale": "mtp.safetensors",
|
| 87939 |
+
"model.layers.92.mlp.experts.154.up_proj.weight": "mtp.safetensors",
|
| 87940 |
+
"model.layers.92.mlp.experts.154.up_proj.weight_scale": "mtp.safetensors",
|
| 87941 |
+
"model.layers.92.mlp.experts.155.down_proj.weight": "mtp.safetensors",
|
| 87942 |
+
"model.layers.92.mlp.experts.155.down_proj.weight_scale": "mtp.safetensors",
|
| 87943 |
+
"model.layers.92.mlp.experts.155.gate_proj.weight": "mtp.safetensors",
|
| 87944 |
+
"model.layers.92.mlp.experts.155.gate_proj.weight_scale": "mtp.safetensors",
|
| 87945 |
+
"model.layers.92.mlp.experts.155.up_proj.weight": "mtp.safetensors",
|
| 87946 |
+
"model.layers.92.mlp.experts.155.up_proj.weight_scale": "mtp.safetensors",
|
| 87947 |
+
"model.layers.92.mlp.experts.156.down_proj.weight": "mtp.safetensors",
|
| 87948 |
+
"model.layers.92.mlp.experts.156.down_proj.weight_scale": "mtp.safetensors",
|
| 87949 |
+
"model.layers.92.mlp.experts.156.gate_proj.weight": "mtp.safetensors",
|
| 87950 |
+
"model.layers.92.mlp.experts.156.gate_proj.weight_scale": "mtp.safetensors",
|
| 87951 |
+
"model.layers.92.mlp.experts.156.up_proj.weight": "mtp.safetensors",
|
| 87952 |
+
"model.layers.92.mlp.experts.156.up_proj.weight_scale": "mtp.safetensors",
|
| 87953 |
+
"model.layers.92.mlp.experts.157.down_proj.weight": "mtp.safetensors",
|
| 87954 |
+
"model.layers.92.mlp.experts.157.down_proj.weight_scale": "mtp.safetensors",
|
| 87955 |
+
"model.layers.92.mlp.experts.157.gate_proj.weight": "mtp.safetensors",
|
| 87956 |
+
"model.layers.92.mlp.experts.157.gate_proj.weight_scale": "mtp.safetensors",
|
| 87957 |
+
"model.layers.92.mlp.experts.157.up_proj.weight": "mtp.safetensors",
|
| 87958 |
+
"model.layers.92.mlp.experts.157.up_proj.weight_scale": "mtp.safetensors",
|
| 87959 |
+
"model.layers.92.mlp.experts.158.down_proj.weight": "mtp.safetensors",
|
| 87960 |
+
"model.layers.92.mlp.experts.158.down_proj.weight_scale": "mtp.safetensors",
|
| 87961 |
+
"model.layers.92.mlp.experts.158.gate_proj.weight": "mtp.safetensors",
|
| 87962 |
+
"model.layers.92.mlp.experts.158.gate_proj.weight_scale": "mtp.safetensors",
|
| 87963 |
+
"model.layers.92.mlp.experts.158.up_proj.weight": "mtp.safetensors",
|
| 87964 |
+
"model.layers.92.mlp.experts.158.up_proj.weight_scale": "mtp.safetensors",
|
| 87965 |
+
"model.layers.92.mlp.experts.159.down_proj.weight": "mtp.safetensors",
|
| 87966 |
+
"model.layers.92.mlp.experts.159.down_proj.weight_scale": "mtp.safetensors",
|
| 87967 |
+
"model.layers.92.mlp.experts.159.gate_proj.weight": "mtp.safetensors",
|
| 87968 |
+
"model.layers.92.mlp.experts.159.gate_proj.weight_scale": "mtp.safetensors",
|
| 87969 |
+
"model.layers.92.mlp.experts.159.up_proj.weight": "mtp.safetensors",
|
| 87970 |
+
"model.layers.92.mlp.experts.159.up_proj.weight_scale": "mtp.safetensors",
|
| 87971 |
+
"model.layers.92.mlp.experts.16.down_proj.weight": "mtp.safetensors",
|
| 87972 |
+
"model.layers.92.mlp.experts.16.down_proj.weight_scale": "mtp.safetensors",
|
| 87973 |
+
"model.layers.92.mlp.experts.16.gate_proj.weight": "mtp.safetensors",
|
| 87974 |
+
"model.layers.92.mlp.experts.16.gate_proj.weight_scale": "mtp.safetensors",
|
| 87975 |
+
"model.layers.92.mlp.experts.16.up_proj.weight": "mtp.safetensors",
|
| 87976 |
+
"model.layers.92.mlp.experts.16.up_proj.weight_scale": "mtp.safetensors",
|
| 87977 |
+
"model.layers.92.mlp.experts.17.down_proj.weight": "mtp.safetensors",
|
| 87978 |
+
"model.layers.92.mlp.experts.17.down_proj.weight_scale": "mtp.safetensors",
|
| 87979 |
+
"model.layers.92.mlp.experts.17.gate_proj.weight": "mtp.safetensors",
|
| 87980 |
+
"model.layers.92.mlp.experts.17.gate_proj.weight_scale": "mtp.safetensors",
|
| 87981 |
+
"model.layers.92.mlp.experts.17.up_proj.weight": "mtp.safetensors",
|
| 87982 |
+
"model.layers.92.mlp.experts.17.up_proj.weight_scale": "mtp.safetensors",
|
| 87983 |
+
"model.layers.92.mlp.experts.18.down_proj.weight": "mtp.safetensors",
|
| 87984 |
+
"model.layers.92.mlp.experts.18.down_proj.weight_scale": "mtp.safetensors",
|
| 87985 |
+
"model.layers.92.mlp.experts.18.gate_proj.weight": "mtp.safetensors",
|
| 87986 |
+
"model.layers.92.mlp.experts.18.gate_proj.weight_scale": "mtp.safetensors",
|
| 87987 |
+
"model.layers.92.mlp.experts.18.up_proj.weight": "mtp.safetensors",
|
| 87988 |
+
"model.layers.92.mlp.experts.18.up_proj.weight_scale": "mtp.safetensors",
|
| 87989 |
+
"model.layers.92.mlp.experts.19.down_proj.weight": "mtp.safetensors",
|
| 87990 |
+
"model.layers.92.mlp.experts.19.down_proj.weight_scale": "mtp.safetensors",
|
| 87991 |
+
"model.layers.92.mlp.experts.19.gate_proj.weight": "mtp.safetensors",
|
| 87992 |
+
"model.layers.92.mlp.experts.19.gate_proj.weight_scale": "mtp.safetensors",
|
| 87993 |
+
"model.layers.92.mlp.experts.19.up_proj.weight": "mtp.safetensors",
|
| 87994 |
+
"model.layers.92.mlp.experts.19.up_proj.weight_scale": "mtp.safetensors",
|
| 87995 |
+
"model.layers.92.mlp.experts.2.down_proj.weight": "mtp.safetensors",
|
| 87996 |
+
"model.layers.92.mlp.experts.2.down_proj.weight_scale": "mtp.safetensors",
|
| 87997 |
+
"model.layers.92.mlp.experts.2.gate_proj.weight": "mtp.safetensors",
|
| 87998 |
+
"model.layers.92.mlp.experts.2.gate_proj.weight_scale": "mtp.safetensors",
|
| 87999 |
+
"model.layers.92.mlp.experts.2.up_proj.weight": "mtp.safetensors",
|
| 88000 |
+
"model.layers.92.mlp.experts.2.up_proj.weight_scale": "mtp.safetensors",
|
| 88001 |
+
"model.layers.92.mlp.experts.20.down_proj.weight": "mtp.safetensors",
|
| 88002 |
+
"model.layers.92.mlp.experts.20.down_proj.weight_scale": "mtp.safetensors",
|
| 88003 |
+
"model.layers.92.mlp.experts.20.gate_proj.weight": "mtp.safetensors",
|
| 88004 |
+
"model.layers.92.mlp.experts.20.gate_proj.weight_scale": "mtp.safetensors",
|
| 88005 |
+
"model.layers.92.mlp.experts.20.up_proj.weight": "mtp.safetensors",
|
| 88006 |
+
"model.layers.92.mlp.experts.20.up_proj.weight_scale": "mtp.safetensors",
|
| 88007 |
+
"model.layers.92.mlp.experts.21.down_proj.weight": "mtp.safetensors",
|
| 88008 |
+
"model.layers.92.mlp.experts.21.down_proj.weight_scale": "mtp.safetensors",
|
| 88009 |
+
"model.layers.92.mlp.experts.21.gate_proj.weight": "mtp.safetensors",
|
| 88010 |
+
"model.layers.92.mlp.experts.21.gate_proj.weight_scale": "mtp.safetensors",
|
| 88011 |
+
"model.layers.92.mlp.experts.21.up_proj.weight": "mtp.safetensors",
|
| 88012 |
+
"model.layers.92.mlp.experts.21.up_proj.weight_scale": "mtp.safetensors",
|
| 88013 |
+
"model.layers.92.mlp.experts.22.down_proj.weight": "mtp.safetensors",
|
| 88014 |
+
"model.layers.92.mlp.experts.22.down_proj.weight_scale": "mtp.safetensors",
|
| 88015 |
+
"model.layers.92.mlp.experts.22.gate_proj.weight": "mtp.safetensors",
|
| 88016 |
+
"model.layers.92.mlp.experts.22.gate_proj.weight_scale": "mtp.safetensors",
|
| 88017 |
+
"model.layers.92.mlp.experts.22.up_proj.weight": "mtp.safetensors",
|
| 88018 |
+
"model.layers.92.mlp.experts.22.up_proj.weight_scale": "mtp.safetensors",
|
| 88019 |
+
"model.layers.92.mlp.experts.23.down_proj.weight": "mtp.safetensors",
|
| 88020 |
+
"model.layers.92.mlp.experts.23.down_proj.weight_scale": "mtp.safetensors",
|
| 88021 |
+
"model.layers.92.mlp.experts.23.gate_proj.weight": "mtp.safetensors",
|
| 88022 |
+
"model.layers.92.mlp.experts.23.gate_proj.weight_scale": "mtp.safetensors",
|
| 88023 |
+
"model.layers.92.mlp.experts.23.up_proj.weight": "mtp.safetensors",
|
| 88024 |
+
"model.layers.92.mlp.experts.23.up_proj.weight_scale": "mtp.safetensors",
|
| 88025 |
+
"model.layers.92.mlp.experts.24.down_proj.weight": "mtp.safetensors",
|
| 88026 |
+
"model.layers.92.mlp.experts.24.down_proj.weight_scale": "mtp.safetensors",
|
| 88027 |
+
"model.layers.92.mlp.experts.24.gate_proj.weight": "mtp.safetensors",
|
| 88028 |
+
"model.layers.92.mlp.experts.24.gate_proj.weight_scale": "mtp.safetensors",
|
| 88029 |
+
"model.layers.92.mlp.experts.24.up_proj.weight": "mtp.safetensors",
|
| 88030 |
+
"model.layers.92.mlp.experts.24.up_proj.weight_scale": "mtp.safetensors",
|
| 88031 |
+
"model.layers.92.mlp.experts.25.down_proj.weight": "mtp.safetensors",
|
| 88032 |
+
"model.layers.92.mlp.experts.25.down_proj.weight_scale": "mtp.safetensors",
|
| 88033 |
+
"model.layers.92.mlp.experts.25.gate_proj.weight": "mtp.safetensors",
|
| 88034 |
+
"model.layers.92.mlp.experts.25.gate_proj.weight_scale": "mtp.safetensors",
|
| 88035 |
+
"model.layers.92.mlp.experts.25.up_proj.weight": "mtp.safetensors",
|
| 88036 |
+
"model.layers.92.mlp.experts.25.up_proj.weight_scale": "mtp.safetensors",
|
| 88037 |
+
"model.layers.92.mlp.experts.26.down_proj.weight": "mtp.safetensors",
|
| 88038 |
+
"model.layers.92.mlp.experts.26.down_proj.weight_scale": "mtp.safetensors",
|
| 88039 |
+
"model.layers.92.mlp.experts.26.gate_proj.weight": "mtp.safetensors",
|
| 88040 |
+
"model.layers.92.mlp.experts.26.gate_proj.weight_scale": "mtp.safetensors",
|
| 88041 |
+
"model.layers.92.mlp.experts.26.up_proj.weight": "mtp.safetensors",
|
| 88042 |
+
"model.layers.92.mlp.experts.26.up_proj.weight_scale": "mtp.safetensors",
|
| 88043 |
+
"model.layers.92.mlp.experts.27.down_proj.weight": "mtp.safetensors",
|
| 88044 |
+
"model.layers.92.mlp.experts.27.down_proj.weight_scale": "mtp.safetensors",
|
| 88045 |
+
"model.layers.92.mlp.experts.27.gate_proj.weight": "mtp.safetensors",
|
| 88046 |
+
"model.layers.92.mlp.experts.27.gate_proj.weight_scale": "mtp.safetensors",
|
| 88047 |
+
"model.layers.92.mlp.experts.27.up_proj.weight": "mtp.safetensors",
|
| 88048 |
+
"model.layers.92.mlp.experts.27.up_proj.weight_scale": "mtp.safetensors",
|
| 88049 |
+
"model.layers.92.mlp.experts.28.down_proj.weight": "mtp.safetensors",
|
| 88050 |
+
"model.layers.92.mlp.experts.28.down_proj.weight_scale": "mtp.safetensors",
|
| 88051 |
+
"model.layers.92.mlp.experts.28.gate_proj.weight": "mtp.safetensors",
|
| 88052 |
+
"model.layers.92.mlp.experts.28.gate_proj.weight_scale": "mtp.safetensors",
|
| 88053 |
+
"model.layers.92.mlp.experts.28.up_proj.weight": "mtp.safetensors",
|
| 88054 |
+
"model.layers.92.mlp.experts.28.up_proj.weight_scale": "mtp.safetensors",
|
| 88055 |
+
"model.layers.92.mlp.experts.29.down_proj.weight": "mtp.safetensors",
|
| 88056 |
+
"model.layers.92.mlp.experts.29.down_proj.weight_scale": "mtp.safetensors",
|
| 88057 |
+
"model.layers.92.mlp.experts.29.gate_proj.weight": "mtp.safetensors",
|
| 88058 |
+
"model.layers.92.mlp.experts.29.gate_proj.weight_scale": "mtp.safetensors",
|
| 88059 |
+
"model.layers.92.mlp.experts.29.up_proj.weight": "mtp.safetensors",
|
| 88060 |
+
"model.layers.92.mlp.experts.29.up_proj.weight_scale": "mtp.safetensors",
|
| 88061 |
+
"model.layers.92.mlp.experts.3.down_proj.weight": "mtp.safetensors",
|
| 88062 |
+
"model.layers.92.mlp.experts.3.down_proj.weight_scale": "mtp.safetensors",
|
| 88063 |
+
"model.layers.92.mlp.experts.3.gate_proj.weight": "mtp.safetensors",
|
| 88064 |
+
"model.layers.92.mlp.experts.3.gate_proj.weight_scale": "mtp.safetensors",
|
| 88065 |
+
"model.layers.92.mlp.experts.3.up_proj.weight": "mtp.safetensors",
|
| 88066 |
+
"model.layers.92.mlp.experts.3.up_proj.weight_scale": "mtp.safetensors",
|
| 88067 |
+
"model.layers.92.mlp.experts.30.down_proj.weight": "mtp.safetensors",
|
| 88068 |
+
"model.layers.92.mlp.experts.30.down_proj.weight_scale": "mtp.safetensors",
|
| 88069 |
+
"model.layers.92.mlp.experts.30.gate_proj.weight": "mtp.safetensors",
|
| 88070 |
+
"model.layers.92.mlp.experts.30.gate_proj.weight_scale": "mtp.safetensors",
|
| 88071 |
+
"model.layers.92.mlp.experts.30.up_proj.weight": "mtp.safetensors",
|
| 88072 |
+
"model.layers.92.mlp.experts.30.up_proj.weight_scale": "mtp.safetensors",
|
| 88073 |
+
"model.layers.92.mlp.experts.31.down_proj.weight": "mtp.safetensors",
|
| 88074 |
+
"model.layers.92.mlp.experts.31.down_proj.weight_scale": "mtp.safetensors",
|
| 88075 |
+
"model.layers.92.mlp.experts.31.gate_proj.weight": "mtp.safetensors",
|
| 88076 |
+
"model.layers.92.mlp.experts.31.gate_proj.weight_scale": "mtp.safetensors",
|
| 88077 |
+
"model.layers.92.mlp.experts.31.up_proj.weight": "mtp.safetensors",
|
| 88078 |
+
"model.layers.92.mlp.experts.31.up_proj.weight_scale": "mtp.safetensors",
|
| 88079 |
+
"model.layers.92.mlp.experts.32.down_proj.weight": "mtp.safetensors",
|
| 88080 |
+
"model.layers.92.mlp.experts.32.down_proj.weight_scale": "mtp.safetensors",
|
| 88081 |
+
"model.layers.92.mlp.experts.32.gate_proj.weight": "mtp.safetensors",
|
| 88082 |
+
"model.layers.92.mlp.experts.32.gate_proj.weight_scale": "mtp.safetensors",
|
| 88083 |
+
"model.layers.92.mlp.experts.32.up_proj.weight": "mtp.safetensors",
|
| 88084 |
+
"model.layers.92.mlp.experts.32.up_proj.weight_scale": "mtp.safetensors",
|
| 88085 |
+
"model.layers.92.mlp.experts.33.down_proj.weight": "mtp.safetensors",
|
| 88086 |
+
"model.layers.92.mlp.experts.33.down_proj.weight_scale": "mtp.safetensors",
|
| 88087 |
+
"model.layers.92.mlp.experts.33.gate_proj.weight": "mtp.safetensors",
|
| 88088 |
+
"model.layers.92.mlp.experts.33.gate_proj.weight_scale": "mtp.safetensors",
|
| 88089 |
+
"model.layers.92.mlp.experts.33.up_proj.weight": "mtp.safetensors",
|
| 88090 |
+
"model.layers.92.mlp.experts.33.up_proj.weight_scale": "mtp.safetensors",
|
| 88091 |
+
"model.layers.92.mlp.experts.34.down_proj.weight": "mtp.safetensors",
|
| 88092 |
+
"model.layers.92.mlp.experts.34.down_proj.weight_scale": "mtp.safetensors",
|
| 88093 |
+
"model.layers.92.mlp.experts.34.gate_proj.weight": "mtp.safetensors",
|
| 88094 |
+
"model.layers.92.mlp.experts.34.gate_proj.weight_scale": "mtp.safetensors",
|
| 88095 |
+
"model.layers.92.mlp.experts.34.up_proj.weight": "mtp.safetensors",
|
| 88096 |
+
"model.layers.92.mlp.experts.34.up_proj.weight_scale": "mtp.safetensors",
|
| 88097 |
+
"model.layers.92.mlp.experts.35.down_proj.weight": "mtp.safetensors",
|
| 88098 |
+
"model.layers.92.mlp.experts.35.down_proj.weight_scale": "mtp.safetensors",
|
| 88099 |
+
"model.layers.92.mlp.experts.35.gate_proj.weight": "mtp.safetensors",
|
| 88100 |
+
"model.layers.92.mlp.experts.35.gate_proj.weight_scale": "mtp.safetensors",
|
| 88101 |
+
"model.layers.92.mlp.experts.35.up_proj.weight": "mtp.safetensors",
|
| 88102 |
+
"model.layers.92.mlp.experts.35.up_proj.weight_scale": "mtp.safetensors",
|
| 88103 |
+
"model.layers.92.mlp.experts.36.down_proj.weight": "mtp.safetensors",
|
| 88104 |
+
"model.layers.92.mlp.experts.36.down_proj.weight_scale": "mtp.safetensors",
|
| 88105 |
+
"model.layers.92.mlp.experts.36.gate_proj.weight": "mtp.safetensors",
|
| 88106 |
+
"model.layers.92.mlp.experts.36.gate_proj.weight_scale": "mtp.safetensors",
|
| 88107 |
+
"model.layers.92.mlp.experts.36.up_proj.weight": "mtp.safetensors",
|
| 88108 |
+
"model.layers.92.mlp.experts.36.up_proj.weight_scale": "mtp.safetensors",
|
| 88109 |
+
"model.layers.92.mlp.experts.37.down_proj.weight": "mtp.safetensors",
|
| 88110 |
+
"model.layers.92.mlp.experts.37.down_proj.weight_scale": "mtp.safetensors",
|
| 88111 |
+
"model.layers.92.mlp.experts.37.gate_proj.weight": "mtp.safetensors",
|
| 88112 |
+
"model.layers.92.mlp.experts.37.gate_proj.weight_scale": "mtp.safetensors",
|
| 88113 |
+
"model.layers.92.mlp.experts.37.up_proj.weight": "mtp.safetensors",
|
| 88114 |
+
"model.layers.92.mlp.experts.37.up_proj.weight_scale": "mtp.safetensors",
|
| 88115 |
+
"model.layers.92.mlp.experts.38.down_proj.weight": "mtp.safetensors",
|
| 88116 |
+
"model.layers.92.mlp.experts.38.down_proj.weight_scale": "mtp.safetensors",
|
| 88117 |
+
"model.layers.92.mlp.experts.38.gate_proj.weight": "mtp.safetensors",
|
| 88118 |
+
"model.layers.92.mlp.experts.38.gate_proj.weight_scale": "mtp.safetensors",
|
| 88119 |
+
"model.layers.92.mlp.experts.38.up_proj.weight": "mtp.safetensors",
|
| 88120 |
+
"model.layers.92.mlp.experts.38.up_proj.weight_scale": "mtp.safetensors",
|
| 88121 |
+
"model.layers.92.mlp.experts.39.down_proj.weight": "mtp.safetensors",
|
| 88122 |
+
"model.layers.92.mlp.experts.39.down_proj.weight_scale": "mtp.safetensors",
|
| 88123 |
+
"model.layers.92.mlp.experts.39.gate_proj.weight": "mtp.safetensors",
|
| 88124 |
+
"model.layers.92.mlp.experts.39.gate_proj.weight_scale": "mtp.safetensors",
|
| 88125 |
+
"model.layers.92.mlp.experts.39.up_proj.weight": "mtp.safetensors",
|
| 88126 |
+
"model.layers.92.mlp.experts.39.up_proj.weight_scale": "mtp.safetensors",
|
| 88127 |
+
"model.layers.92.mlp.experts.4.down_proj.weight": "mtp.safetensors",
|
| 88128 |
+
"model.layers.92.mlp.experts.4.down_proj.weight_scale": "mtp.safetensors",
|
| 88129 |
+
"model.layers.92.mlp.experts.4.gate_proj.weight": "mtp.safetensors",
|
| 88130 |
+
"model.layers.92.mlp.experts.4.gate_proj.weight_scale": "mtp.safetensors",
|
| 88131 |
+
"model.layers.92.mlp.experts.4.up_proj.weight": "mtp.safetensors",
|
| 88132 |
+
"model.layers.92.mlp.experts.4.up_proj.weight_scale": "mtp.safetensors",
|
| 88133 |
+
"model.layers.92.mlp.experts.40.down_proj.weight": "mtp.safetensors",
|
| 88134 |
+
"model.layers.92.mlp.experts.40.down_proj.weight_scale": "mtp.safetensors",
|
| 88135 |
+
"model.layers.92.mlp.experts.40.gate_proj.weight": "mtp.safetensors",
|
| 88136 |
+
"model.layers.92.mlp.experts.40.gate_proj.weight_scale": "mtp.safetensors",
|
| 88137 |
+
"model.layers.92.mlp.experts.40.up_proj.weight": "mtp.safetensors",
|
| 88138 |
+
"model.layers.92.mlp.experts.40.up_proj.weight_scale": "mtp.safetensors",
|
| 88139 |
+
"model.layers.92.mlp.experts.41.down_proj.weight": "mtp.safetensors",
|
| 88140 |
+
"model.layers.92.mlp.experts.41.down_proj.weight_scale": "mtp.safetensors",
|
| 88141 |
+
"model.layers.92.mlp.experts.41.gate_proj.weight": "mtp.safetensors",
|
| 88142 |
+
"model.layers.92.mlp.experts.41.gate_proj.weight_scale": "mtp.safetensors",
|
| 88143 |
+
"model.layers.92.mlp.experts.41.up_proj.weight": "mtp.safetensors",
|
| 88144 |
+
"model.layers.92.mlp.experts.41.up_proj.weight_scale": "mtp.safetensors",
|
| 88145 |
+
"model.layers.92.mlp.experts.42.down_proj.weight": "mtp.safetensors",
|
| 88146 |
+
"model.layers.92.mlp.experts.42.down_proj.weight_scale": "mtp.safetensors",
|
| 88147 |
+
"model.layers.92.mlp.experts.42.gate_proj.weight": "mtp.safetensors",
|
| 88148 |
+
"model.layers.92.mlp.experts.42.gate_proj.weight_scale": "mtp.safetensors",
|
| 88149 |
+
"model.layers.92.mlp.experts.42.up_proj.weight": "mtp.safetensors",
|
| 88150 |
+
"model.layers.92.mlp.experts.42.up_proj.weight_scale": "mtp.safetensors",
|
| 88151 |
+
"model.layers.92.mlp.experts.43.down_proj.weight": "mtp.safetensors",
|
| 88152 |
+
"model.layers.92.mlp.experts.43.down_proj.weight_scale": "mtp.safetensors",
|
| 88153 |
+
"model.layers.92.mlp.experts.43.gate_proj.weight": "mtp.safetensors",
|
| 88154 |
+
"model.layers.92.mlp.experts.43.gate_proj.weight_scale": "mtp.safetensors",
|
| 88155 |
+
"model.layers.92.mlp.experts.43.up_proj.weight": "mtp.safetensors",
|
| 88156 |
+
"model.layers.92.mlp.experts.43.up_proj.weight_scale": "mtp.safetensors",
|
| 88157 |
+
"model.layers.92.mlp.experts.44.down_proj.weight": "mtp.safetensors",
|
| 88158 |
+
"model.layers.92.mlp.experts.44.down_proj.weight_scale": "mtp.safetensors",
|
| 88159 |
+
"model.layers.92.mlp.experts.44.gate_proj.weight": "mtp.safetensors",
|
| 88160 |
+
"model.layers.92.mlp.experts.44.gate_proj.weight_scale": "mtp.safetensors",
|
| 88161 |
+
"model.layers.92.mlp.experts.44.up_proj.weight": "mtp.safetensors",
|
| 88162 |
+
"model.layers.92.mlp.experts.44.up_proj.weight_scale": "mtp.safetensors",
|
| 88163 |
+
"model.layers.92.mlp.experts.45.down_proj.weight": "mtp.safetensors",
|
| 88164 |
+
"model.layers.92.mlp.experts.45.down_proj.weight_scale": "mtp.safetensors",
|
| 88165 |
+
"model.layers.92.mlp.experts.45.gate_proj.weight": "mtp.safetensors",
|
| 88166 |
+
"model.layers.92.mlp.experts.45.gate_proj.weight_scale": "mtp.safetensors",
|
| 88167 |
+
"model.layers.92.mlp.experts.45.up_proj.weight": "mtp.safetensors",
|
| 88168 |
+
"model.layers.92.mlp.experts.45.up_proj.weight_scale": "mtp.safetensors",
|
| 88169 |
+
"model.layers.92.mlp.experts.46.down_proj.weight": "mtp.safetensors",
|
| 88170 |
+
"model.layers.92.mlp.experts.46.down_proj.weight_scale": "mtp.safetensors",
|
| 88171 |
+
"model.layers.92.mlp.experts.46.gate_proj.weight": "mtp.safetensors",
|
| 88172 |
+
"model.layers.92.mlp.experts.46.gate_proj.weight_scale": "mtp.safetensors",
|
| 88173 |
+
"model.layers.92.mlp.experts.46.up_proj.weight": "mtp.safetensors",
|
| 88174 |
+
"model.layers.92.mlp.experts.46.up_proj.weight_scale": "mtp.safetensors",
|
| 88175 |
+
"model.layers.92.mlp.experts.47.down_proj.weight": "mtp.safetensors",
|
| 88176 |
+
"model.layers.92.mlp.experts.47.down_proj.weight_scale": "mtp.safetensors",
|
| 88177 |
+
"model.layers.92.mlp.experts.47.gate_proj.weight": "mtp.safetensors",
|
| 88178 |
+
"model.layers.92.mlp.experts.47.gate_proj.weight_scale": "mtp.safetensors",
|
| 88179 |
+
"model.layers.92.mlp.experts.47.up_proj.weight": "mtp.safetensors",
|
| 88180 |
+
"model.layers.92.mlp.experts.47.up_proj.weight_scale": "mtp.safetensors",
|
| 88181 |
+
"model.layers.92.mlp.experts.48.down_proj.weight": "mtp.safetensors",
|
| 88182 |
+
"model.layers.92.mlp.experts.48.down_proj.weight_scale": "mtp.safetensors",
|
| 88183 |
+
"model.layers.92.mlp.experts.48.gate_proj.weight": "mtp.safetensors",
|
| 88184 |
+
"model.layers.92.mlp.experts.48.gate_proj.weight_scale": "mtp.safetensors",
|
| 88185 |
+
"model.layers.92.mlp.experts.48.up_proj.weight": "mtp.safetensors",
|
| 88186 |
+
"model.layers.92.mlp.experts.48.up_proj.weight_scale": "mtp.safetensors",
|
| 88187 |
+
"model.layers.92.mlp.experts.49.down_proj.weight": "mtp.safetensors",
|
| 88188 |
+
"model.layers.92.mlp.experts.49.down_proj.weight_scale": "mtp.safetensors",
|
| 88189 |
+
"model.layers.92.mlp.experts.49.gate_proj.weight": "mtp.safetensors",
|
| 88190 |
+
"model.layers.92.mlp.experts.49.gate_proj.weight_scale": "mtp.safetensors",
|
| 88191 |
+
"model.layers.92.mlp.experts.49.up_proj.weight": "mtp.safetensors",
|
| 88192 |
+
"model.layers.92.mlp.experts.49.up_proj.weight_scale": "mtp.safetensors",
|
| 88193 |
+
"model.layers.92.mlp.experts.5.down_proj.weight": "mtp.safetensors",
|
| 88194 |
+
"model.layers.92.mlp.experts.5.down_proj.weight_scale": "mtp.safetensors",
|
| 88195 |
+
"model.layers.92.mlp.experts.5.gate_proj.weight": "mtp.safetensors",
|
| 88196 |
+
"model.layers.92.mlp.experts.5.gate_proj.weight_scale": "mtp.safetensors",
|
| 88197 |
+
"model.layers.92.mlp.experts.5.up_proj.weight": "mtp.safetensors",
|
| 88198 |
+
"model.layers.92.mlp.experts.5.up_proj.weight_scale": "mtp.safetensors",
|
| 88199 |
+
"model.layers.92.mlp.experts.50.down_proj.weight": "mtp.safetensors",
|
| 88200 |
+
"model.layers.92.mlp.experts.50.down_proj.weight_scale": "mtp.safetensors",
|
| 88201 |
+
"model.layers.92.mlp.experts.50.gate_proj.weight": "mtp.safetensors",
|
| 88202 |
+
"model.layers.92.mlp.experts.50.gate_proj.weight_scale": "mtp.safetensors",
|
| 88203 |
+
"model.layers.92.mlp.experts.50.up_proj.weight": "mtp.safetensors",
|
| 88204 |
+
"model.layers.92.mlp.experts.50.up_proj.weight_scale": "mtp.safetensors",
|
| 88205 |
+
"model.layers.92.mlp.experts.51.down_proj.weight": "mtp.safetensors",
|
| 88206 |
+
"model.layers.92.mlp.experts.51.down_proj.weight_scale": "mtp.safetensors",
|
| 88207 |
+
"model.layers.92.mlp.experts.51.gate_proj.weight": "mtp.safetensors",
|
| 88208 |
+
"model.layers.92.mlp.experts.51.gate_proj.weight_scale": "mtp.safetensors",
|
| 88209 |
+
"model.layers.92.mlp.experts.51.up_proj.weight": "mtp.safetensors",
|
| 88210 |
+
"model.layers.92.mlp.experts.51.up_proj.weight_scale": "mtp.safetensors",
|
| 88211 |
+
"model.layers.92.mlp.experts.52.down_proj.weight": "mtp.safetensors",
|
| 88212 |
+
"model.layers.92.mlp.experts.52.down_proj.weight_scale": "mtp.safetensors",
|
| 88213 |
+
"model.layers.92.mlp.experts.52.gate_proj.weight": "mtp.safetensors",
|
| 88214 |
+
"model.layers.92.mlp.experts.52.gate_proj.weight_scale": "mtp.safetensors",
|
| 88215 |
+
"model.layers.92.mlp.experts.52.up_proj.weight": "mtp.safetensors",
|
| 88216 |
+
"model.layers.92.mlp.experts.52.up_proj.weight_scale": "mtp.safetensors",
|
| 88217 |
+
"model.layers.92.mlp.experts.53.down_proj.weight": "mtp.safetensors",
|
| 88218 |
+
"model.layers.92.mlp.experts.53.down_proj.weight_scale": "mtp.safetensors",
|
| 88219 |
+
"model.layers.92.mlp.experts.53.gate_proj.weight": "mtp.safetensors",
|
| 88220 |
+
"model.layers.92.mlp.experts.53.gate_proj.weight_scale": "mtp.safetensors",
|
| 88221 |
+
"model.layers.92.mlp.experts.53.up_proj.weight": "mtp.safetensors",
|
| 88222 |
+
"model.layers.92.mlp.experts.53.up_proj.weight_scale": "mtp.safetensors",
|
| 88223 |
+
"model.layers.92.mlp.experts.54.down_proj.weight": "mtp.safetensors",
|
| 88224 |
+
"model.layers.92.mlp.experts.54.down_proj.weight_scale": "mtp.safetensors",
|
| 88225 |
+
"model.layers.92.mlp.experts.54.gate_proj.weight": "mtp.safetensors",
|
| 88226 |
+
"model.layers.92.mlp.experts.54.gate_proj.weight_scale": "mtp.safetensors",
|
| 88227 |
+
"model.layers.92.mlp.experts.54.up_proj.weight": "mtp.safetensors",
|
| 88228 |
+
"model.layers.92.mlp.experts.54.up_proj.weight_scale": "mtp.safetensors",
|
| 88229 |
+
"model.layers.92.mlp.experts.55.down_proj.weight": "mtp.safetensors",
|
| 88230 |
+
"model.layers.92.mlp.experts.55.down_proj.weight_scale": "mtp.safetensors",
|
| 88231 |
+
"model.layers.92.mlp.experts.55.gate_proj.weight": "mtp.safetensors",
|
| 88232 |
+
"model.layers.92.mlp.experts.55.gate_proj.weight_scale": "mtp.safetensors",
|
| 88233 |
+
"model.layers.92.mlp.experts.55.up_proj.weight": "mtp.safetensors",
|
| 88234 |
+
"model.layers.92.mlp.experts.55.up_proj.weight_scale": "mtp.safetensors",
|
| 88235 |
+
"model.layers.92.mlp.experts.56.down_proj.weight": "mtp.safetensors",
|
| 88236 |
+
"model.layers.92.mlp.experts.56.down_proj.weight_scale": "mtp.safetensors",
|
| 88237 |
+
"model.layers.92.mlp.experts.56.gate_proj.weight": "mtp.safetensors",
|
| 88238 |
+
"model.layers.92.mlp.experts.56.gate_proj.weight_scale": "mtp.safetensors",
|
| 88239 |
+
"model.layers.92.mlp.experts.56.up_proj.weight": "mtp.safetensors",
|
| 88240 |
+
"model.layers.92.mlp.experts.56.up_proj.weight_scale": "mtp.safetensors",
|
| 88241 |
+
"model.layers.92.mlp.experts.57.down_proj.weight": "mtp.safetensors",
|
| 88242 |
+
"model.layers.92.mlp.experts.57.down_proj.weight_scale": "mtp.safetensors",
|
| 88243 |
+
"model.layers.92.mlp.experts.57.gate_proj.weight": "mtp.safetensors",
|
| 88244 |
+
"model.layers.92.mlp.experts.57.gate_proj.weight_scale": "mtp.safetensors",
|
| 88245 |
+
"model.layers.92.mlp.experts.57.up_proj.weight": "mtp.safetensors",
|
| 88246 |
+
"model.layers.92.mlp.experts.57.up_proj.weight_scale": "mtp.safetensors",
|
| 88247 |
+
"model.layers.92.mlp.experts.58.down_proj.weight": "mtp.safetensors",
|
| 88248 |
+
"model.layers.92.mlp.experts.58.down_proj.weight_scale": "mtp.safetensors",
|
| 88249 |
+
"model.layers.92.mlp.experts.58.gate_proj.weight": "mtp.safetensors",
|
| 88250 |
+
"model.layers.92.mlp.experts.58.gate_proj.weight_scale": "mtp.safetensors",
|
| 88251 |
+
"model.layers.92.mlp.experts.58.up_proj.weight": "mtp.safetensors",
|
| 88252 |
+
"model.layers.92.mlp.experts.58.up_proj.weight_scale": "mtp.safetensors",
|
| 88253 |
+
"model.layers.92.mlp.experts.59.down_proj.weight": "mtp.safetensors",
|
| 88254 |
+
"model.layers.92.mlp.experts.59.down_proj.weight_scale": "mtp.safetensors",
|
| 88255 |
+
"model.layers.92.mlp.experts.59.gate_proj.weight": "mtp.safetensors",
|
| 88256 |
+
"model.layers.92.mlp.experts.59.gate_proj.weight_scale": "mtp.safetensors",
|
| 88257 |
+
"model.layers.92.mlp.experts.59.up_proj.weight": "mtp.safetensors",
|
| 88258 |
+
"model.layers.92.mlp.experts.59.up_proj.weight_scale": "mtp.safetensors",
|
| 88259 |
+
"model.layers.92.mlp.experts.6.down_proj.weight": "mtp.safetensors",
|
| 88260 |
+
"model.layers.92.mlp.experts.6.down_proj.weight_scale": "mtp.safetensors",
|
| 88261 |
+
"model.layers.92.mlp.experts.6.gate_proj.weight": "mtp.safetensors",
|
| 88262 |
+
"model.layers.92.mlp.experts.6.gate_proj.weight_scale": "mtp.safetensors",
|
| 88263 |
+
"model.layers.92.mlp.experts.6.up_proj.weight": "mtp.safetensors",
|
| 88264 |
+
"model.layers.92.mlp.experts.6.up_proj.weight_scale": "mtp.safetensors",
|
| 88265 |
+
"model.layers.92.mlp.experts.60.down_proj.weight": "mtp.safetensors",
|
| 88266 |
+
"model.layers.92.mlp.experts.60.down_proj.weight_scale": "mtp.safetensors",
|
| 88267 |
+
"model.layers.92.mlp.experts.60.gate_proj.weight": "mtp.safetensors",
|
| 88268 |
+
"model.layers.92.mlp.experts.60.gate_proj.weight_scale": "mtp.safetensors",
|
| 88269 |
+
"model.layers.92.mlp.experts.60.up_proj.weight": "mtp.safetensors",
|
| 88270 |
+
"model.layers.92.mlp.experts.60.up_proj.weight_scale": "mtp.safetensors",
|
| 88271 |
+
"model.layers.92.mlp.experts.61.down_proj.weight": "mtp.safetensors",
|
| 88272 |
+
"model.layers.92.mlp.experts.61.down_proj.weight_scale": "mtp.safetensors",
|
| 88273 |
+
"model.layers.92.mlp.experts.61.gate_proj.weight": "mtp.safetensors",
|
| 88274 |
+
"model.layers.92.mlp.experts.61.gate_proj.weight_scale": "mtp.safetensors",
|
| 88275 |
+
"model.layers.92.mlp.experts.61.up_proj.weight": "mtp.safetensors",
|
| 88276 |
+
"model.layers.92.mlp.experts.61.up_proj.weight_scale": "mtp.safetensors",
|
| 88277 |
+
"model.layers.92.mlp.experts.62.down_proj.weight": "mtp.safetensors",
|
| 88278 |
+
"model.layers.92.mlp.experts.62.down_proj.weight_scale": "mtp.safetensors",
|
| 88279 |
+
"model.layers.92.mlp.experts.62.gate_proj.weight": "mtp.safetensors",
|
| 88280 |
+
"model.layers.92.mlp.experts.62.gate_proj.weight_scale": "mtp.safetensors",
|
| 88281 |
+
"model.layers.92.mlp.experts.62.up_proj.weight": "mtp.safetensors",
|
| 88282 |
+
"model.layers.92.mlp.experts.62.up_proj.weight_scale": "mtp.safetensors",
|
| 88283 |
+
"model.layers.92.mlp.experts.63.down_proj.weight": "mtp.safetensors",
|
| 88284 |
+
"model.layers.92.mlp.experts.63.down_proj.weight_scale": "mtp.safetensors",
|
| 88285 |
+
"model.layers.92.mlp.experts.63.gate_proj.weight": "mtp.safetensors",
|
| 88286 |
+
"model.layers.92.mlp.experts.63.gate_proj.weight_scale": "mtp.safetensors",
|
| 88287 |
+
"model.layers.92.mlp.experts.63.up_proj.weight": "mtp.safetensors",
|
| 88288 |
+
"model.layers.92.mlp.experts.63.up_proj.weight_scale": "mtp.safetensors",
|
| 88289 |
+
"model.layers.92.mlp.experts.64.down_proj.weight": "mtp.safetensors",
|
| 88290 |
+
"model.layers.92.mlp.experts.64.down_proj.weight_scale": "mtp.safetensors",
|
| 88291 |
+
"model.layers.92.mlp.experts.64.gate_proj.weight": "mtp.safetensors",
|
| 88292 |
+
"model.layers.92.mlp.experts.64.gate_proj.weight_scale": "mtp.safetensors",
|
| 88293 |
+
"model.layers.92.mlp.experts.64.up_proj.weight": "mtp.safetensors",
|
| 88294 |
+
"model.layers.92.mlp.experts.64.up_proj.weight_scale": "mtp.safetensors",
|
| 88295 |
+
"model.layers.92.mlp.experts.65.down_proj.weight": "mtp.safetensors",
|
| 88296 |
+
"model.layers.92.mlp.experts.65.down_proj.weight_scale": "mtp.safetensors",
|
| 88297 |
+
"model.layers.92.mlp.experts.65.gate_proj.weight": "mtp.safetensors",
|
| 88298 |
+
"model.layers.92.mlp.experts.65.gate_proj.weight_scale": "mtp.safetensors",
|
| 88299 |
+
"model.layers.92.mlp.experts.65.up_proj.weight": "mtp.safetensors",
|
| 88300 |
+
"model.layers.92.mlp.experts.65.up_proj.weight_scale": "mtp.safetensors",
|
| 88301 |
+
"model.layers.92.mlp.experts.66.down_proj.weight": "mtp.safetensors",
|
| 88302 |
+
"model.layers.92.mlp.experts.66.down_proj.weight_scale": "mtp.safetensors",
|
| 88303 |
+
"model.layers.92.mlp.experts.66.gate_proj.weight": "mtp.safetensors",
|
| 88304 |
+
"model.layers.92.mlp.experts.66.gate_proj.weight_scale": "mtp.safetensors",
|
| 88305 |
+
"model.layers.92.mlp.experts.66.up_proj.weight": "mtp.safetensors",
|
| 88306 |
+
"model.layers.92.mlp.experts.66.up_proj.weight_scale": "mtp.safetensors",
|
| 88307 |
+
"model.layers.92.mlp.experts.67.down_proj.weight": "mtp.safetensors",
|
| 88308 |
+
"model.layers.92.mlp.experts.67.down_proj.weight_scale": "mtp.safetensors",
|
| 88309 |
+
"model.layers.92.mlp.experts.67.gate_proj.weight": "mtp.safetensors",
|
| 88310 |
+
"model.layers.92.mlp.experts.67.gate_proj.weight_scale": "mtp.safetensors",
|
| 88311 |
+
"model.layers.92.mlp.experts.67.up_proj.weight": "mtp.safetensors",
|
| 88312 |
+
"model.layers.92.mlp.experts.67.up_proj.weight_scale": "mtp.safetensors",
|
| 88313 |
+
"model.layers.92.mlp.experts.68.down_proj.weight": "mtp.safetensors",
|
| 88314 |
+
"model.layers.92.mlp.experts.68.down_proj.weight_scale": "mtp.safetensors",
|
| 88315 |
+
"model.layers.92.mlp.experts.68.gate_proj.weight": "mtp.safetensors",
|
| 88316 |
+
"model.layers.92.mlp.experts.68.gate_proj.weight_scale": "mtp.safetensors",
|
| 88317 |
+
"model.layers.92.mlp.experts.68.up_proj.weight": "mtp.safetensors",
|
| 88318 |
+
"model.layers.92.mlp.experts.68.up_proj.weight_scale": "mtp.safetensors",
|
| 88319 |
+
"model.layers.92.mlp.experts.69.down_proj.weight": "mtp.safetensors",
|
| 88320 |
+
"model.layers.92.mlp.experts.69.down_proj.weight_scale": "mtp.safetensors",
|
| 88321 |
+
"model.layers.92.mlp.experts.69.gate_proj.weight": "mtp.safetensors",
|
| 88322 |
+
"model.layers.92.mlp.experts.69.gate_proj.weight_scale": "mtp.safetensors",
|
| 88323 |
+
"model.layers.92.mlp.experts.69.up_proj.weight": "mtp.safetensors",
|
| 88324 |
+
"model.layers.92.mlp.experts.69.up_proj.weight_scale": "mtp.safetensors",
|
| 88325 |
+
"model.layers.92.mlp.experts.7.down_proj.weight": "mtp.safetensors",
|
| 88326 |
+
"model.layers.92.mlp.experts.7.down_proj.weight_scale": "mtp.safetensors",
|
| 88327 |
+
"model.layers.92.mlp.experts.7.gate_proj.weight": "mtp.safetensors",
|
| 88328 |
+
"model.layers.92.mlp.experts.7.gate_proj.weight_scale": "mtp.safetensors",
|
| 88329 |
+
"model.layers.92.mlp.experts.7.up_proj.weight": "mtp.safetensors",
|
| 88330 |
+
"model.layers.92.mlp.experts.7.up_proj.weight_scale": "mtp.safetensors",
|
| 88331 |
+
"model.layers.92.mlp.experts.70.down_proj.weight": "mtp.safetensors",
|
| 88332 |
+
"model.layers.92.mlp.experts.70.down_proj.weight_scale": "mtp.safetensors",
|
| 88333 |
+
"model.layers.92.mlp.experts.70.gate_proj.weight": "mtp.safetensors",
|
| 88334 |
+
"model.layers.92.mlp.experts.70.gate_proj.weight_scale": "mtp.safetensors",
|
| 88335 |
+
"model.layers.92.mlp.experts.70.up_proj.weight": "mtp.safetensors",
|
| 88336 |
+
"model.layers.92.mlp.experts.70.up_proj.weight_scale": "mtp.safetensors",
|
| 88337 |
+
"model.layers.92.mlp.experts.71.down_proj.weight": "mtp.safetensors",
|
| 88338 |
+
"model.layers.92.mlp.experts.71.down_proj.weight_scale": "mtp.safetensors",
|
| 88339 |
+
"model.layers.92.mlp.experts.71.gate_proj.weight": "mtp.safetensors",
|
| 88340 |
+
"model.layers.92.mlp.experts.71.gate_proj.weight_scale": "mtp.safetensors",
|
| 88341 |
+
"model.layers.92.mlp.experts.71.up_proj.weight": "mtp.safetensors",
|
| 88342 |
+
"model.layers.92.mlp.experts.71.up_proj.weight_scale": "mtp.safetensors",
|
| 88343 |
+
"model.layers.92.mlp.experts.72.down_proj.weight": "mtp.safetensors",
|
| 88344 |
+
"model.layers.92.mlp.experts.72.down_proj.weight_scale": "mtp.safetensors",
|
| 88345 |
+
"model.layers.92.mlp.experts.72.gate_proj.weight": "mtp.safetensors",
|
| 88346 |
+
"model.layers.92.mlp.experts.72.gate_proj.weight_scale": "mtp.safetensors",
|
| 88347 |
+
"model.layers.92.mlp.experts.72.up_proj.weight": "mtp.safetensors",
|
| 88348 |
+
"model.layers.92.mlp.experts.72.up_proj.weight_scale": "mtp.safetensors",
|
| 88349 |
+
"model.layers.92.mlp.experts.73.down_proj.weight": "mtp.safetensors",
|
| 88350 |
+
"model.layers.92.mlp.experts.73.down_proj.weight_scale": "mtp.safetensors",
|
| 88351 |
+
"model.layers.92.mlp.experts.73.gate_proj.weight": "mtp.safetensors",
|
| 88352 |
+
"model.layers.92.mlp.experts.73.gate_proj.weight_scale": "mtp.safetensors",
|
| 88353 |
+
"model.layers.92.mlp.experts.73.up_proj.weight": "mtp.safetensors",
|
| 88354 |
+
"model.layers.92.mlp.experts.73.up_proj.weight_scale": "mtp.safetensors",
|
| 88355 |
+
"model.layers.92.mlp.experts.74.down_proj.weight": "mtp.safetensors",
|
| 88356 |
+
"model.layers.92.mlp.experts.74.down_proj.weight_scale": "mtp.safetensors",
|
| 88357 |
+
"model.layers.92.mlp.experts.74.gate_proj.weight": "mtp.safetensors",
|
| 88358 |
+
"model.layers.92.mlp.experts.74.gate_proj.weight_scale": "mtp.safetensors",
|
| 88359 |
+
"model.layers.92.mlp.experts.74.up_proj.weight": "mtp.safetensors",
|
| 88360 |
+
"model.layers.92.mlp.experts.74.up_proj.weight_scale": "mtp.safetensors",
|
| 88361 |
+
"model.layers.92.mlp.experts.75.down_proj.weight": "mtp.safetensors",
|
| 88362 |
+
"model.layers.92.mlp.experts.75.down_proj.weight_scale": "mtp.safetensors",
|
| 88363 |
+
"model.layers.92.mlp.experts.75.gate_proj.weight": "mtp.safetensors",
|
| 88364 |
+
"model.layers.92.mlp.experts.75.gate_proj.weight_scale": "mtp.safetensors",
|
| 88365 |
+
"model.layers.92.mlp.experts.75.up_proj.weight": "mtp.safetensors",
|
| 88366 |
+
"model.layers.92.mlp.experts.75.up_proj.weight_scale": "mtp.safetensors",
|
| 88367 |
+
"model.layers.92.mlp.experts.76.down_proj.weight": "mtp.safetensors",
|
| 88368 |
+
"model.layers.92.mlp.experts.76.down_proj.weight_scale": "mtp.safetensors",
|
| 88369 |
+
"model.layers.92.mlp.experts.76.gate_proj.weight": "mtp.safetensors",
|
| 88370 |
+
"model.layers.92.mlp.experts.76.gate_proj.weight_scale": "mtp.safetensors",
|
| 88371 |
+
"model.layers.92.mlp.experts.76.up_proj.weight": "mtp.safetensors",
|
| 88372 |
+
"model.layers.92.mlp.experts.76.up_proj.weight_scale": "mtp.safetensors",
|
| 88373 |
+
"model.layers.92.mlp.experts.77.down_proj.weight": "mtp.safetensors",
|
| 88374 |
+
"model.layers.92.mlp.experts.77.down_proj.weight_scale": "mtp.safetensors",
|
| 88375 |
+
"model.layers.92.mlp.experts.77.gate_proj.weight": "mtp.safetensors",
|
| 88376 |
+
"model.layers.92.mlp.experts.77.gate_proj.weight_scale": "mtp.safetensors",
|
| 88377 |
+
"model.layers.92.mlp.experts.77.up_proj.weight": "mtp.safetensors",
|
| 88378 |
+
"model.layers.92.mlp.experts.77.up_proj.weight_scale": "mtp.safetensors",
|
| 88379 |
+
"model.layers.92.mlp.experts.78.down_proj.weight": "mtp.safetensors",
|
| 88380 |
+
"model.layers.92.mlp.experts.78.down_proj.weight_scale": "mtp.safetensors",
|
| 88381 |
+
"model.layers.92.mlp.experts.78.gate_proj.weight": "mtp.safetensors",
|
| 88382 |
+
"model.layers.92.mlp.experts.78.gate_proj.weight_scale": "mtp.safetensors",
|
| 88383 |
+
"model.layers.92.mlp.experts.78.up_proj.weight": "mtp.safetensors",
|
| 88384 |
+
"model.layers.92.mlp.experts.78.up_proj.weight_scale": "mtp.safetensors",
|
| 88385 |
+
"model.layers.92.mlp.experts.79.down_proj.weight": "mtp.safetensors",
|
| 88386 |
+
"model.layers.92.mlp.experts.79.down_proj.weight_scale": "mtp.safetensors",
|
| 88387 |
+
"model.layers.92.mlp.experts.79.gate_proj.weight": "mtp.safetensors",
|
| 88388 |
+
"model.layers.92.mlp.experts.79.gate_proj.weight_scale": "mtp.safetensors",
|
| 88389 |
+
"model.layers.92.mlp.experts.79.up_proj.weight": "mtp.safetensors",
|
| 88390 |
+
"model.layers.92.mlp.experts.79.up_proj.weight_scale": "mtp.safetensors",
|
| 88391 |
+
"model.layers.92.mlp.experts.8.down_proj.weight": "mtp.safetensors",
|
| 88392 |
+
"model.layers.92.mlp.experts.8.down_proj.weight_scale": "mtp.safetensors",
|
| 88393 |
+
"model.layers.92.mlp.experts.8.gate_proj.weight": "mtp.safetensors",
|
| 88394 |
+
"model.layers.92.mlp.experts.8.gate_proj.weight_scale": "mtp.safetensors",
|
| 88395 |
+
"model.layers.92.mlp.experts.8.up_proj.weight": "mtp.safetensors",
|
| 88396 |
+
"model.layers.92.mlp.experts.8.up_proj.weight_scale": "mtp.safetensors",
|
| 88397 |
+
"model.layers.92.mlp.experts.80.down_proj.weight": "mtp.safetensors",
|
| 88398 |
+
"model.layers.92.mlp.experts.80.down_proj.weight_scale": "mtp.safetensors",
|
| 88399 |
+
"model.layers.92.mlp.experts.80.gate_proj.weight": "mtp.safetensors",
|
| 88400 |
+
"model.layers.92.mlp.experts.80.gate_proj.weight_scale": "mtp.safetensors",
|
| 88401 |
+
"model.layers.92.mlp.experts.80.up_proj.weight": "mtp.safetensors",
|
| 88402 |
+
"model.layers.92.mlp.experts.80.up_proj.weight_scale": "mtp.safetensors",
|
| 88403 |
+
"model.layers.92.mlp.experts.81.down_proj.weight": "mtp.safetensors",
|
| 88404 |
+
"model.layers.92.mlp.experts.81.down_proj.weight_scale": "mtp.safetensors",
|
| 88405 |
+
"model.layers.92.mlp.experts.81.gate_proj.weight": "mtp.safetensors",
|
| 88406 |
+
"model.layers.92.mlp.experts.81.gate_proj.weight_scale": "mtp.safetensors",
|
| 88407 |
+
"model.layers.92.mlp.experts.81.up_proj.weight": "mtp.safetensors",
|
| 88408 |
+
"model.layers.92.mlp.experts.81.up_proj.weight_scale": "mtp.safetensors",
|
| 88409 |
+
"model.layers.92.mlp.experts.82.down_proj.weight": "mtp.safetensors",
|
| 88410 |
+
"model.layers.92.mlp.experts.82.down_proj.weight_scale": "mtp.safetensors",
|
| 88411 |
+
"model.layers.92.mlp.experts.82.gate_proj.weight": "mtp.safetensors",
|
| 88412 |
+
"model.layers.92.mlp.experts.82.gate_proj.weight_scale": "mtp.safetensors",
|
| 88413 |
+
"model.layers.92.mlp.experts.82.up_proj.weight": "mtp.safetensors",
|
| 88414 |
+
"model.layers.92.mlp.experts.82.up_proj.weight_scale": "mtp.safetensors",
|
| 88415 |
+
"model.layers.92.mlp.experts.83.down_proj.weight": "mtp.safetensors",
|
| 88416 |
+
"model.layers.92.mlp.experts.83.down_proj.weight_scale": "mtp.safetensors",
|
| 88417 |
+
"model.layers.92.mlp.experts.83.gate_proj.weight": "mtp.safetensors",
|
| 88418 |
+
"model.layers.92.mlp.experts.83.gate_proj.weight_scale": "mtp.safetensors",
|
| 88419 |
+
"model.layers.92.mlp.experts.83.up_proj.weight": "mtp.safetensors",
|
| 88420 |
+
"model.layers.92.mlp.experts.83.up_proj.weight_scale": "mtp.safetensors",
|
| 88421 |
+
"model.layers.92.mlp.experts.84.down_proj.weight": "mtp.safetensors",
|
| 88422 |
+
"model.layers.92.mlp.experts.84.down_proj.weight_scale": "mtp.safetensors",
|
| 88423 |
+
"model.layers.92.mlp.experts.84.gate_proj.weight": "mtp.safetensors",
|
| 88424 |
+
"model.layers.92.mlp.experts.84.gate_proj.weight_scale": "mtp.safetensors",
|
| 88425 |
+
"model.layers.92.mlp.experts.84.up_proj.weight": "mtp.safetensors",
|
| 88426 |
+
"model.layers.92.mlp.experts.84.up_proj.weight_scale": "mtp.safetensors",
|
| 88427 |
+
"model.layers.92.mlp.experts.85.down_proj.weight": "mtp.safetensors",
|
| 88428 |
+
"model.layers.92.mlp.experts.85.down_proj.weight_scale": "mtp.safetensors",
|
| 88429 |
+
"model.layers.92.mlp.experts.85.gate_proj.weight": "mtp.safetensors",
|
| 88430 |
+
"model.layers.92.mlp.experts.85.gate_proj.weight_scale": "mtp.safetensors",
|
| 88431 |
+
"model.layers.92.mlp.experts.85.up_proj.weight": "mtp.safetensors",
|
| 88432 |
+
"model.layers.92.mlp.experts.85.up_proj.weight_scale": "mtp.safetensors",
|
| 88433 |
+
"model.layers.92.mlp.experts.86.down_proj.weight": "mtp.safetensors",
|
| 88434 |
+
"model.layers.92.mlp.experts.86.down_proj.weight_scale": "mtp.safetensors",
|
| 88435 |
+
"model.layers.92.mlp.experts.86.gate_proj.weight": "mtp.safetensors",
|
| 88436 |
+
"model.layers.92.mlp.experts.86.gate_proj.weight_scale": "mtp.safetensors",
|
| 88437 |
+
"model.layers.92.mlp.experts.86.up_proj.weight": "mtp.safetensors",
|
| 88438 |
+
"model.layers.92.mlp.experts.86.up_proj.weight_scale": "mtp.safetensors",
|
| 88439 |
+
"model.layers.92.mlp.experts.87.down_proj.weight": "mtp.safetensors",
|
| 88440 |
+
"model.layers.92.mlp.experts.87.down_proj.weight_scale": "mtp.safetensors",
|
| 88441 |
+
"model.layers.92.mlp.experts.87.gate_proj.weight": "mtp.safetensors",
|
| 88442 |
+
"model.layers.92.mlp.experts.87.gate_proj.weight_scale": "mtp.safetensors",
|
| 88443 |
+
"model.layers.92.mlp.experts.87.up_proj.weight": "mtp.safetensors",
|
| 88444 |
+
"model.layers.92.mlp.experts.87.up_proj.weight_scale": "mtp.safetensors",
|
| 88445 |
+
"model.layers.92.mlp.experts.88.down_proj.weight": "mtp.safetensors",
|
| 88446 |
+
"model.layers.92.mlp.experts.88.down_proj.weight_scale": "mtp.safetensors",
|
| 88447 |
+
"model.layers.92.mlp.experts.88.gate_proj.weight": "mtp.safetensors",
|
| 88448 |
+
"model.layers.92.mlp.experts.88.gate_proj.weight_scale": "mtp.safetensors",
|
| 88449 |
+
"model.layers.92.mlp.experts.88.up_proj.weight": "mtp.safetensors",
|
| 88450 |
+
"model.layers.92.mlp.experts.88.up_proj.weight_scale": "mtp.safetensors",
|
| 88451 |
+
"model.layers.92.mlp.experts.89.down_proj.weight": "mtp.safetensors",
|
| 88452 |
+
"model.layers.92.mlp.experts.89.down_proj.weight_scale": "mtp.safetensors",
|
| 88453 |
+
"model.layers.92.mlp.experts.89.gate_proj.weight": "mtp.safetensors",
|
| 88454 |
+
"model.layers.92.mlp.experts.89.gate_proj.weight_scale": "mtp.safetensors",
|
| 88455 |
+
"model.layers.92.mlp.experts.89.up_proj.weight": "mtp.safetensors",
|
| 88456 |
+
"model.layers.92.mlp.experts.89.up_proj.weight_scale": "mtp.safetensors",
|
| 88457 |
+
"model.layers.92.mlp.experts.9.down_proj.weight": "mtp.safetensors",
|
| 88458 |
+
"model.layers.92.mlp.experts.9.down_proj.weight_scale": "mtp.safetensors",
|
| 88459 |
+
"model.layers.92.mlp.experts.9.gate_proj.weight": "mtp.safetensors",
|
| 88460 |
+
"model.layers.92.mlp.experts.9.gate_proj.weight_scale": "mtp.safetensors",
|
| 88461 |
+
"model.layers.92.mlp.experts.9.up_proj.weight": "mtp.safetensors",
|
| 88462 |
+
"model.layers.92.mlp.experts.9.up_proj.weight_scale": "mtp.safetensors",
|
| 88463 |
+
"model.layers.92.mlp.experts.90.down_proj.weight": "mtp.safetensors",
|
| 88464 |
+
"model.layers.92.mlp.experts.90.down_proj.weight_scale": "mtp.safetensors",
|
| 88465 |
+
"model.layers.92.mlp.experts.90.gate_proj.weight": "mtp.safetensors",
|
| 88466 |
+
"model.layers.92.mlp.experts.90.gate_proj.weight_scale": "mtp.safetensors",
|
| 88467 |
+
"model.layers.92.mlp.experts.90.up_proj.weight": "mtp.safetensors",
|
| 88468 |
+
"model.layers.92.mlp.experts.90.up_proj.weight_scale": "mtp.safetensors",
|
| 88469 |
+
"model.layers.92.mlp.experts.91.down_proj.weight": "mtp.safetensors",
|
| 88470 |
+
"model.layers.92.mlp.experts.91.down_proj.weight_scale": "mtp.safetensors",
|
| 88471 |
+
"model.layers.92.mlp.experts.91.gate_proj.weight": "mtp.safetensors",
|
| 88472 |
+
"model.layers.92.mlp.experts.91.gate_proj.weight_scale": "mtp.safetensors",
|
| 88473 |
+
"model.layers.92.mlp.experts.91.up_proj.weight": "mtp.safetensors",
|
| 88474 |
+
"model.layers.92.mlp.experts.91.up_proj.weight_scale": "mtp.safetensors",
|
| 88475 |
+
"model.layers.92.mlp.experts.92.down_proj.weight": "mtp.safetensors",
|
| 88476 |
+
"model.layers.92.mlp.experts.92.down_proj.weight_scale": "mtp.safetensors",
|
| 88477 |
+
"model.layers.92.mlp.experts.92.gate_proj.weight": "mtp.safetensors",
|
| 88478 |
+
"model.layers.92.mlp.experts.92.gate_proj.weight_scale": "mtp.safetensors",
|
| 88479 |
+
"model.layers.92.mlp.experts.92.up_proj.weight": "mtp.safetensors",
|
| 88480 |
+
"model.layers.92.mlp.experts.92.up_proj.weight_scale": "mtp.safetensors",
|
| 88481 |
+
"model.layers.92.mlp.experts.93.down_proj.weight": "mtp.safetensors",
|
| 88482 |
+
"model.layers.92.mlp.experts.93.down_proj.weight_scale": "mtp.safetensors",
|
| 88483 |
+
"model.layers.92.mlp.experts.93.gate_proj.weight": "mtp.safetensors",
|
| 88484 |
+
"model.layers.92.mlp.experts.93.gate_proj.weight_scale": "mtp.safetensors",
|
| 88485 |
+
"model.layers.92.mlp.experts.93.up_proj.weight": "mtp.safetensors",
|
| 88486 |
+
"model.layers.92.mlp.experts.93.up_proj.weight_scale": "mtp.safetensors",
|
| 88487 |
+
"model.layers.92.mlp.experts.94.down_proj.weight": "mtp.safetensors",
|
| 88488 |
+
"model.layers.92.mlp.experts.94.down_proj.weight_scale": "mtp.safetensors",
|
| 88489 |
+
"model.layers.92.mlp.experts.94.gate_proj.weight": "mtp.safetensors",
|
| 88490 |
+
"model.layers.92.mlp.experts.94.gate_proj.weight_scale": "mtp.safetensors",
|
| 88491 |
+
"model.layers.92.mlp.experts.94.up_proj.weight": "mtp.safetensors",
|
| 88492 |
+
"model.layers.92.mlp.experts.94.up_proj.weight_scale": "mtp.safetensors",
|
| 88493 |
+
"model.layers.92.mlp.experts.95.down_proj.weight": "mtp.safetensors",
|
| 88494 |
+
"model.layers.92.mlp.experts.95.down_proj.weight_scale": "mtp.safetensors",
|
| 88495 |
+
"model.layers.92.mlp.experts.95.gate_proj.weight": "mtp.safetensors",
|
| 88496 |
+
"model.layers.92.mlp.experts.95.gate_proj.weight_scale": "mtp.safetensors",
|
| 88497 |
+
"model.layers.92.mlp.experts.95.up_proj.weight": "mtp.safetensors",
|
| 88498 |
+
"model.layers.92.mlp.experts.95.up_proj.weight_scale": "mtp.safetensors",
|
| 88499 |
+
"model.layers.92.mlp.experts.96.down_proj.weight": "mtp.safetensors",
|
| 88500 |
+
"model.layers.92.mlp.experts.96.down_proj.weight_scale": "mtp.safetensors",
|
| 88501 |
+
"model.layers.92.mlp.experts.96.gate_proj.weight": "mtp.safetensors",
|
| 88502 |
+
"model.layers.92.mlp.experts.96.gate_proj.weight_scale": "mtp.safetensors",
|
| 88503 |
+
"model.layers.92.mlp.experts.96.up_proj.weight": "mtp.safetensors",
|
| 88504 |
+
"model.layers.92.mlp.experts.96.up_proj.weight_scale": "mtp.safetensors",
|
| 88505 |
+
"model.layers.92.mlp.experts.97.down_proj.weight": "mtp.safetensors",
|
| 88506 |
+
"model.layers.92.mlp.experts.97.down_proj.weight_scale": "mtp.safetensors",
|
| 88507 |
+
"model.layers.92.mlp.experts.97.gate_proj.weight": "mtp.safetensors",
|
| 88508 |
+
"model.layers.92.mlp.experts.97.gate_proj.weight_scale": "mtp.safetensors",
|
| 88509 |
+
"model.layers.92.mlp.experts.97.up_proj.weight": "mtp.safetensors",
|
| 88510 |
+
"model.layers.92.mlp.experts.97.up_proj.weight_scale": "mtp.safetensors",
|
| 88511 |
+
"model.layers.92.mlp.experts.98.down_proj.weight": "mtp.safetensors",
|
| 88512 |
+
"model.layers.92.mlp.experts.98.down_proj.weight_scale": "mtp.safetensors",
|
| 88513 |
+
"model.layers.92.mlp.experts.98.gate_proj.weight": "mtp.safetensors",
|
| 88514 |
+
"model.layers.92.mlp.experts.98.gate_proj.weight_scale": "mtp.safetensors",
|
| 88515 |
+
"model.layers.92.mlp.experts.98.up_proj.weight": "mtp.safetensors",
|
| 88516 |
+
"model.layers.92.mlp.experts.98.up_proj.weight_scale": "mtp.safetensors",
|
| 88517 |
+
"model.layers.92.mlp.experts.99.down_proj.weight": "mtp.safetensors",
|
| 88518 |
+
"model.layers.92.mlp.experts.99.down_proj.weight_scale": "mtp.safetensors",
|
| 88519 |
+
"model.layers.92.mlp.experts.99.gate_proj.weight": "mtp.safetensors",
|
| 88520 |
+
"model.layers.92.mlp.experts.99.gate_proj.weight_scale": "mtp.safetensors",
|
| 88521 |
+
"model.layers.92.mlp.experts.99.up_proj.weight": "mtp.safetensors",
|
| 88522 |
+
"model.layers.92.mlp.experts.99.up_proj.weight_scale": "mtp.safetensors",
|
| 88523 |
+
"model.layers.92.mlp.gate.e_score_correction_bias": "mtp.safetensors",
|
| 88524 |
+
"model.layers.92.mlp.gate.weight": "mtp.safetensors",
|
| 88525 |
+
"model.layers.92.mlp.shared_experts.down_proj.weight": "mtp.safetensors",
|
| 88526 |
+
"model.layers.92.mlp.shared_experts.down_proj.weight_scale": "mtp.safetensors",
|
| 88527 |
+
"model.layers.92.mlp.shared_experts.gate_proj.weight": "mtp.safetensors",
|
| 88528 |
+
"model.layers.92.mlp.shared_experts.gate_proj.weight_scale": "mtp.safetensors",
|
| 88529 |
+
"model.layers.92.mlp.shared_experts.up_proj.weight": "mtp.safetensors",
|
| 88530 |
+
"model.layers.92.mlp.shared_experts.up_proj.weight_scale": "mtp.safetensors",
|
| 88531 |
+
"model.layers.92.post_attention_layernorm.weight": "mtp.safetensors",
|
| 88532 |
+
"model.layers.92.self_attn.k_norm.weight": "mtp.safetensors",
|
| 88533 |
+
"model.layers.92.self_attn.k_proj.bias": "mtp.safetensors",
|
| 88534 |
+
"model.layers.92.self_attn.k_proj.weight": "mtp.safetensors",
|
| 88535 |
+
"model.layers.92.self_attn.k_proj.weight_scale": "mtp.safetensors",
|
| 88536 |
+
"model.layers.92.self_attn.o_proj.weight": "mtp.safetensors",
|
| 88537 |
+
"model.layers.92.self_attn.o_proj.weight_scale": "mtp.safetensors",
|
| 88538 |
+
"model.layers.92.self_attn.q_norm.weight": "mtp.safetensors",
|
| 88539 |
+
"model.layers.92.self_attn.q_proj.bias": "mtp.safetensors",
|
| 88540 |
+
"model.layers.92.self_attn.q_proj.weight": "mtp.safetensors",
|
| 88541 |
+
"model.layers.92.self_attn.q_proj.weight_scale": "mtp.safetensors",
|
| 88542 |
+
"model.layers.92.self_attn.v_proj.bias": "mtp.safetensors",
|
| 88543 |
+
"model.layers.92.self_attn.v_proj.weight": "mtp.safetensors",
|
| 88544 |
+
"model.layers.92.self_attn.v_proj.weight_scale": "mtp.safetensors",
|
| 88545 |
+
"model.layers.92.shared_head.norm.weight": "mtp.safetensors"
|
| 88546 |
},
|
| 88547 |
"metadata": {
|
| 88548 |
"total_size": 241145664
|