{ "metadata": { "total_size": 150871132160 }, "weight_map": { "lm_heads.0.norm.weight": "model-00031-of-00032.safetensors", "lm_heads.0.weight": "model-00031-of-00032.safetensors", "lm_heads.1.norm.weight": "model-00031-of-00032.safetensors", "lm_heads.1.weight": "model-00031-of-00032.safetensors", "lm_heads.2.norm.weight": "model-00031-of-00032.safetensors", "lm_heads.2.weight": "model-00031-of-00032.safetensors", "lm_heads.3.norm.weight": "model-00032-of-00032.safetensors", "lm_heads.3.weight": "model-00032-of-00032.safetensors", "model.embeddings.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.f_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.f_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.g_norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.g_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.g_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.i_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.i_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.o_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn.o_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.attn_norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.mlp.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.mlp.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.0.mlp_norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.f_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.f_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.g_norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.g_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.g_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.i_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.i_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.o_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn.o_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.attn_norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.0.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.0.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.0.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.0.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.1.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.1.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.1.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.1.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.2.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.2.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.2.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.2.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.3.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.3.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.3.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.3.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.4.down_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.4.down_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.4.gate_proj.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.4.gate_proj.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.experts.5.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.5.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.5.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.5.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.6.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.6.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.6.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.6.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.7.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.7.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.7.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.experts.7.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.1.mlp.router.norm.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp.router.weight": "model-00001-of-00032.safetensors", "model.layers.1.mlp_norm.weight": "model-00001-of-00032.safetensors", "model.layers.10.attn.f_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.10.attn.f_proj.weight": "model-00005-of-00032.safetensors", "model.layers.10.attn.g_norm.weight": "model-00006-of-00032.safetensors", "model.layers.10.attn.g_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.10.attn.g_proj.weight": "model-00006-of-00032.safetensors", "model.layers.10.attn.i_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.10.attn.i_proj.weight": "model-00005-of-00032.safetensors", "model.layers.10.attn.o_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.10.attn.o_proj.weight": "model-00006-of-00032.safetensors", "model.layers.10.attn_norm.weight": "model-00005-of-00032.safetensors", "model.layers.10.mlp.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.10.mlp.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.10.mlp.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.10.mlp.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.10.mlp_norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.f_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.f_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.g_norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.g_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.g_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.i_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.i_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.o_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn.o_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.attn_norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.0.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.0.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.0.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.1.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.1.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.1.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.2.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.2.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.2.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.3.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.3.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.3.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.4.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.4.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.4.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.5.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.5.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.5.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.6.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.6.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.6.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.7.down_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.7.down_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.7.gate_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.router.norm.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp.router.weight": "model-00006-of-00032.safetensors", "model.layers.11.mlp_norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.f_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.f_proj.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.g_norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.g_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.g_proj.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.i_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.i_proj.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.o_proj.norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn.o_proj.weight": "model-00006-of-00032.safetensors", "model.layers.12.attn_norm.weight": "model-00006-of-00032.safetensors", "model.layers.12.mlp.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.12.mlp.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.12.mlp.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.12.mlp.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.12.mlp_norm.weight": "model-00006-of-00032.safetensors", "model.layers.13.attn.f_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.f_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.g_norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.g_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.g_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.i_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.i_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.o_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn.o_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.attn_norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.0.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.0.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.0.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.1.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.1.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.1.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.2.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.2.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.2.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.3.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.3.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.3.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.4.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.4.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.4.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.5.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.5.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.5.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.6.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.6.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.6.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.7.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.7.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.7.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.router.norm.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp.router.weight": "model-00007-of-00032.safetensors", "model.layers.13.mlp_norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.f_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.f_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.g_norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.g_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.g_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.i_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.i_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.o_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn.o_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.attn_norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.mlp.down_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.mlp.down_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.mlp.gate_proj.norm.weight": "model-00007-of-00032.safetensors", "model.layers.14.mlp.gate_proj.weight": "model-00007-of-00032.safetensors", "model.layers.14.mlp_norm.weight": "model-00007-of-00032.safetensors", "model.layers.15.attn.f_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.f_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.g_norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.g_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.g_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.i_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.i_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.o_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn.o_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.attn_norm.weight": "model-00007-of-00032.safetensors", "model.layers.15.mlp.experts.0.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.0.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.0.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.1.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.1.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.1.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.2.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.2.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.2.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.3.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.3.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.3.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.4.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.4.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.4.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.5.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.5.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.5.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.6.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.6.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.6.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.7.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.7.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.7.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.router.norm.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp.router.weight": "model-00008-of-00032.safetensors", "model.layers.15.mlp_norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.f_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.f_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.g_norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.g_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.g_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.i_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.i_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.o_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn.o_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.attn_norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.mlp.down_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.mlp.down_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.mlp.gate_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.16.mlp.gate_proj.weight": "model-00008-of-00032.safetensors", "model.layers.16.mlp_norm.weight": "model-00008-of-00032.safetensors", "model.layers.17.attn.f_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.17.attn.f_proj.weight": "model-00008-of-00032.safetensors", "model.layers.17.attn.g_norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.attn.g_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.attn.g_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.attn.i_proj.norm.weight": "model-00008-of-00032.safetensors", "model.layers.17.attn.i_proj.weight": "model-00008-of-00032.safetensors", "model.layers.17.attn.o_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.attn.o_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.attn_norm.weight": "model-00008-of-00032.safetensors", "model.layers.17.mlp.experts.0.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.0.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.0.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.1.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.1.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.1.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.2.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.2.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.2.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.3.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.3.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.3.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.4.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.4.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.4.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.5.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.5.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.5.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.6.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.6.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.6.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.7.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.7.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.7.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.router.norm.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp.router.weight": "model-00009-of-00032.safetensors", "model.layers.17.mlp_norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.f_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.f_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.g_norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.g_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.g_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.i_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.i_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.o_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn.o_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.attn_norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.mlp.down_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.mlp.down_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.mlp.gate_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.18.mlp.gate_proj.weight": "model-00009-of-00032.safetensors", "model.layers.18.mlp_norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.f_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.f_proj.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.g_norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.g_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.g_proj.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.i_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.i_proj.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.o_proj.norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn.o_proj.weight": "model-00009-of-00032.safetensors", "model.layers.19.attn_norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.mlp.experts.0.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.0.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.0.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.1.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.1.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.1.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.2.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.2.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.2.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.3.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.3.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.3.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.4.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.4.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.4.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.5.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.5.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.5.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.6.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.6.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.6.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.7.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.7.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.7.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.19.mlp.router.norm.weight": "model-00009-of-00032.safetensors", "model.layers.19.mlp.router.weight": "model-00009-of-00032.safetensors", "model.layers.19.mlp_norm.weight": "model-00009-of-00032.safetensors", "model.layers.2.attn.f_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.f_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.g_norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.g_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.g_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.i_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.i_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.o_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn.o_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.attn_norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.mlp.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.mlp.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.2.mlp_norm.weight": "model-00002-of-00032.safetensors", "model.layers.20.attn.f_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.f_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.g_norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.g_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.g_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.i_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.i_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.o_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn.o_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.attn_norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.mlp.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.mlp.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.mlp.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.20.mlp.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.20.mlp_norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.f_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.f_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.g_norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.g_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.g_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.i_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.i_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.o_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn.o_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.attn_norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.experts.0.down_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.experts.0.down_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.experts.0.gate_proj.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.experts.1.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.1.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.1.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.2.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.2.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.2.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.3.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.3.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.3.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.4.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.4.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.4.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.5.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.5.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.5.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.6.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.6.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.6.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.7.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.7.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.7.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.21.mlp.router.norm.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp.router.weight": "model-00010-of-00032.safetensors", "model.layers.21.mlp_norm.weight": "model-00010-of-00032.safetensors", "model.layers.22.attn.f_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.f_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.g_norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.g_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.g_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.i_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.i_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.o_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn.o_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.attn_norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.mlp.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.mlp.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.mlp.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.22.mlp.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.22.mlp_norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.f_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.f_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.g_norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.g_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.g_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.i_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.i_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.o_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn.o_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.attn_norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.0.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.0.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.0.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.1.down_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.1.down_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.1.gate_proj.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.experts.2.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.2.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.2.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.3.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.3.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.3.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.4.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.4.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.4.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.5.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.5.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.5.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.6.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.6.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.6.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.7.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.7.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.7.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.23.mlp.router.norm.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp.router.weight": "model-00011-of-00032.safetensors", "model.layers.23.mlp_norm.weight": "model-00011-of-00032.safetensors", "model.layers.24.attn.f_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.f_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.g_norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.g_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.g_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.i_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.i_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.o_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn.o_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.attn_norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.mlp.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.mlp.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.mlp.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.24.mlp.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.24.mlp_norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.f_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.f_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.g_norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.g_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.g_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.i_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.i_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.o_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn.o_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.attn_norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.0.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.0.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.0.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.1.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.1.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.1.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.2.down_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.2.down_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.2.gate_proj.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.experts.3.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.3.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.3.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.4.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.4.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.4.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.5.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.5.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.5.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.6.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.6.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.6.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.7.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.7.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.7.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.25.mlp.router.norm.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp.router.weight": "model-00012-of-00032.safetensors", "model.layers.25.mlp_norm.weight": "model-00012-of-00032.safetensors", "model.layers.26.attn.f_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.f_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.g_norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.g_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.g_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.i_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.i_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.o_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn.o_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.attn_norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.mlp.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.mlp.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.mlp.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.26.mlp.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.26.mlp_norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.f_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.f_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.g_norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.g_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.g_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.i_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.i_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.o_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn.o_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.attn_norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.0.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.0.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.0.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.1.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.1.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.1.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.2.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.2.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.2.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.3.down_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.3.down_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.3.gate_proj.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.experts.4.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.4.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.4.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.5.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.5.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.5.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.6.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.6.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.6.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.7.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.7.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.7.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.27.mlp.router.norm.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp.router.weight": "model-00013-of-00032.safetensors", "model.layers.27.mlp_norm.weight": "model-00013-of-00032.safetensors", "model.layers.28.attn.f_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.f_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.g_norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.g_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.g_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.i_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.i_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.o_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn.o_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.attn_norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.mlp.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.mlp.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.mlp.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.28.mlp.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.28.mlp_norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.f_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.f_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.g_norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.g_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.g_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.i_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.i_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.o_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn.o_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.attn_norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.0.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.0.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.0.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.1.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.1.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.1.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.2.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.2.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.2.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.3.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.3.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.3.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.4.down_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.4.down_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.4.gate_proj.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.experts.5.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.5.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.5.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.6.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.6.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.6.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.7.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.7.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.7.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.29.mlp.router.norm.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp.router.weight": "model-00014-of-00032.safetensors", "model.layers.29.mlp_norm.weight": "model-00014-of-00032.safetensors", "model.layers.3.attn.f_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.f_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.g_norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.g_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.g_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.i_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.i_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.o_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn.o_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.attn_norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.0.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.0.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.0.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.1.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.1.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.1.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.2.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.2.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.2.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.3.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.3.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.3.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.4.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.4.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.4.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.5.down_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.5.down_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.5.gate_proj.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.experts.6.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.6.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.6.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.7.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.7.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.7.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.3.mlp.router.norm.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp.router.weight": "model-00002-of-00032.safetensors", "model.layers.3.mlp_norm.weight": "model-00002-of-00032.safetensors", "model.layers.30.attn.f_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.f_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.g_norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.g_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.g_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.i_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.i_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.o_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn.o_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.attn_norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.mlp.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.mlp.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.mlp.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.30.mlp.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.30.mlp_norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.f_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.f_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.g_norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.g_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.g_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.i_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.i_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.o_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn.o_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.attn_norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.0.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.0.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.0.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.1.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.1.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.1.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.2.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.2.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.2.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.3.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.3.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.3.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.4.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.4.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.4.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.5.down_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.5.down_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.5.gate_proj.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.experts.6.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.6.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.6.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.7.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.7.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.7.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.31.mlp.router.norm.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp.router.weight": "model-00015-of-00032.safetensors", "model.layers.31.mlp_norm.weight": "model-00015-of-00032.safetensors", "model.layers.32.attn.f_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.f_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.g_norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.g_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.g_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.i_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.i_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.o_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn.o_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.attn_norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.mlp.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.mlp.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.mlp.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.32.mlp.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.32.mlp_norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.f_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.f_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.g_norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.g_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.g_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.i_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.i_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.o_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn.o_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.attn_norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.0.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.0.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.0.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.1.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.1.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.1.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.2.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.2.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.2.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.3.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.3.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.3.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.4.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.4.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.4.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.5.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.5.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.5.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.6.down_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.6.down_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.6.gate_proj.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.experts.7.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.33.mlp.experts.7.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.33.mlp.experts.7.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.33.mlp.router.norm.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp.router.weight": "model-00016-of-00032.safetensors", "model.layers.33.mlp_norm.weight": "model-00016-of-00032.safetensors", "model.layers.34.attn.f_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.f_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.g_norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.g_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.g_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.i_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.i_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.o_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn.o_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.attn_norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.mlp.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.mlp.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.mlp.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.34.mlp.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.34.mlp_norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.f_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.f_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.g_norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.g_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.g_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.i_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.i_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.o_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn.o_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.attn_norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.0.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.0.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.0.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.1.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.1.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.1.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.2.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.2.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.2.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.3.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.3.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.3.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.4.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.4.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.4.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.5.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.5.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.5.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.6.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.6.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.6.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.7.down_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.7.down_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.7.gate_proj.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.router.norm.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp.router.weight": "model-00017-of-00032.safetensors", "model.layers.35.mlp_norm.weight": "model-00017-of-00032.safetensors", "model.layers.36.attn.f_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.f_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.g_norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.g_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.g_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.i_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.i_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.o_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn.o_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.attn_norm.weight": "model-00017-of-00032.safetensors", "model.layers.36.mlp.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.mlp.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.mlp.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.36.mlp.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.36.mlp_norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.f_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.f_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.g_norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.g_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.g_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.i_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.i_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.o_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn.o_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.attn_norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.0.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.0.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.0.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.1.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.1.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.1.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.2.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.2.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.2.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.3.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.3.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.3.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.4.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.4.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.4.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.5.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.5.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.5.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.6.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.6.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.6.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.7.down_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.7.down_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.7.gate_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.router.norm.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp.router.weight": "model-00018-of-00032.safetensors", "model.layers.37.mlp_norm.weight": "model-00018-of-00032.safetensors", "model.layers.38.attn.f_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.38.attn.f_proj.weight": "model-00018-of-00032.safetensors", "model.layers.38.attn.g_norm.weight": "model-00019-of-00032.safetensors", "model.layers.38.attn.g_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.38.attn.g_proj.weight": "model-00019-of-00032.safetensors", "model.layers.38.attn.i_proj.norm.weight": "model-00018-of-00032.safetensors", "model.layers.38.attn.i_proj.weight": "model-00018-of-00032.safetensors", "model.layers.38.attn.o_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.38.attn.o_proj.weight": "model-00019-of-00032.safetensors", "model.layers.38.attn_norm.weight": "model-00018-of-00032.safetensors", "model.layers.38.mlp.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.38.mlp.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.38.mlp.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.38.mlp.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.38.mlp_norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.f_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.f_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.g_norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.g_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.g_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.i_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.i_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.o_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn.o_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.attn_norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.0.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.0.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.0.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.1.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.1.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.1.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.2.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.2.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.2.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.3.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.3.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.3.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.4.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.4.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.4.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.5.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.5.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.5.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.6.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.6.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.6.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.7.down_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.7.down_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.7.gate_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.router.norm.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp.router.weight": "model-00019-of-00032.safetensors", "model.layers.39.mlp_norm.weight": "model-00019-of-00032.safetensors", "model.layers.4.attn.f_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.f_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.g_norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.g_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.g_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.i_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.i_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.o_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn.o_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.attn_norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.mlp.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.mlp.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.mlp.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.4.mlp.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.4.mlp_norm.weight": "model-00003-of-00032.safetensors", "model.layers.40.attn.f_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.f_proj.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.g_norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.g_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.g_proj.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.i_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.i_proj.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.o_proj.norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn.o_proj.weight": "model-00019-of-00032.safetensors", "model.layers.40.attn_norm.weight": "model-00019-of-00032.safetensors", "model.layers.40.mlp.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.40.mlp.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.40.mlp.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.40.mlp.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.40.mlp_norm.weight": "model-00019-of-00032.safetensors", "model.layers.41.attn.f_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.f_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.g_norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.g_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.g_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.i_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.i_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.o_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn.o_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.attn_norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.0.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.0.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.0.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.1.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.1.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.1.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.2.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.2.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.2.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.3.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.3.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.3.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.4.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.4.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.4.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.5.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.5.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.5.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.6.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.6.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.6.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.7.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.7.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.7.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.router.norm.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp.router.weight": "model-00020-of-00032.safetensors", "model.layers.41.mlp_norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.f_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.f_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.g_norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.g_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.g_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.i_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.i_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.o_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn.o_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.attn_norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.mlp.down_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.mlp.down_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.mlp.gate_proj.norm.weight": "model-00020-of-00032.safetensors", "model.layers.42.mlp.gate_proj.weight": "model-00020-of-00032.safetensors", "model.layers.42.mlp_norm.weight": "model-00020-of-00032.safetensors", "model.layers.43.attn.f_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.f_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.g_norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.g_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.g_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.i_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.i_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.o_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn.o_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.attn_norm.weight": "model-00020-of-00032.safetensors", "model.layers.43.mlp.experts.0.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.0.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.0.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.1.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.1.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.1.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.2.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.2.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.2.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.3.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.3.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.3.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.4.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.4.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.4.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.5.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.5.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.5.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.6.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.6.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.6.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.7.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.7.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.7.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.router.norm.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp.router.weight": "model-00021-of-00032.safetensors", "model.layers.43.mlp_norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.f_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.f_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.g_norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.g_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.g_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.i_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.i_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.o_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn.o_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.attn_norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.mlp.down_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.mlp.down_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.mlp.gate_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.44.mlp.gate_proj.weight": "model-00021-of-00032.safetensors", "model.layers.44.mlp_norm.weight": "model-00021-of-00032.safetensors", "model.layers.45.attn.f_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.45.attn.f_proj.weight": "model-00021-of-00032.safetensors", "model.layers.45.attn.g_norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.attn.g_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.attn.g_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.attn.i_proj.norm.weight": "model-00021-of-00032.safetensors", "model.layers.45.attn.i_proj.weight": "model-00021-of-00032.safetensors", "model.layers.45.attn.o_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.attn.o_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.attn_norm.weight": "model-00021-of-00032.safetensors", "model.layers.45.mlp.experts.0.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.0.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.0.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.1.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.1.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.1.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.2.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.2.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.2.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.3.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.3.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.3.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.4.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.4.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.4.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.5.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.5.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.5.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.6.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.6.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.6.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.7.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.7.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.7.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.router.norm.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp.router.weight": "model-00022-of-00032.safetensors", "model.layers.45.mlp_norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.f_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.f_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.g_norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.g_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.g_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.i_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.i_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.o_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn.o_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.attn_norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.mlp.down_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.mlp.down_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.mlp.gate_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.46.mlp.gate_proj.weight": "model-00022-of-00032.safetensors", "model.layers.46.mlp_norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.f_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.f_proj.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.g_norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.g_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.g_proj.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.i_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.i_proj.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.o_proj.norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn.o_proj.weight": "model-00022-of-00032.safetensors", "model.layers.47.attn_norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.mlp.experts.0.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.0.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.0.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.1.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.1.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.1.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.2.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.2.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.2.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.3.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.3.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.3.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.4.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.4.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.4.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.5.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.5.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.5.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.6.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.6.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.6.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.7.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.7.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.7.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.47.mlp.router.norm.weight": "model-00022-of-00032.safetensors", "model.layers.47.mlp.router.weight": "model-00022-of-00032.safetensors", "model.layers.47.mlp_norm.weight": "model-00022-of-00032.safetensors", "model.layers.48.attn.f_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.f_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.g_norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.g_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.g_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.i_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.i_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.o_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn.o_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.attn_norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.mlp.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.mlp.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.mlp.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.48.mlp.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.48.mlp_norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.f_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.f_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.g_norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.g_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.g_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.i_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.i_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.o_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn.o_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.attn_norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.experts.0.down_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.experts.0.down_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.experts.0.gate_proj.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.experts.1.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.1.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.1.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.2.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.2.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.2.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.3.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.3.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.3.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.4.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.4.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.4.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.5.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.5.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.5.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.6.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.6.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.6.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.7.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.7.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.7.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.49.mlp.router.norm.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp.router.weight": "model-00023-of-00032.safetensors", "model.layers.49.mlp_norm.weight": "model-00023-of-00032.safetensors", "model.layers.5.attn.f_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.f_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.g_norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.g_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.g_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.i_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.i_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.o_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn.o_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.attn_norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.0.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.0.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.0.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.1.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.1.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.1.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.2.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.2.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.2.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.3.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.3.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.3.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.4.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.4.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.4.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.5.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.5.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.5.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.6.down_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.6.down_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.6.gate_proj.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.experts.7.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.5.mlp.experts.7.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.5.mlp.experts.7.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.5.mlp.router.norm.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp.router.weight": "model-00003-of-00032.safetensors", "model.layers.5.mlp_norm.weight": "model-00003-of-00032.safetensors", "model.layers.50.attn.f_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.f_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.g_norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.g_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.g_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.i_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.i_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.o_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn.o_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.attn_norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.mlp.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.mlp.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.mlp.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.50.mlp.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.50.mlp_norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.f_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.f_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.g_norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.g_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.g_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.i_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.i_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.o_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn.o_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.attn_norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.0.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.0.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.0.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.1.down_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.1.down_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.1.gate_proj.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.experts.2.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.2.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.2.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.3.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.3.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.3.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.4.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.4.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.4.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.5.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.5.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.5.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.6.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.6.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.6.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.7.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.7.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.7.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.51.mlp.router.norm.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp.router.weight": "model-00024-of-00032.safetensors", "model.layers.51.mlp_norm.weight": "model-00024-of-00032.safetensors", "model.layers.52.attn.f_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.f_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.g_norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.g_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.g_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.i_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.i_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.o_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn.o_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.attn_norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.mlp.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.mlp.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.mlp.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.52.mlp.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.52.mlp_norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.f_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.f_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.g_norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.g_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.g_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.i_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.i_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.o_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn.o_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.attn_norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.0.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.0.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.0.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.1.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.1.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.1.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.2.down_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.2.down_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.2.gate_proj.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.experts.3.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.3.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.3.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.4.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.4.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.4.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.5.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.5.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.5.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.6.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.6.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.6.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.7.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.7.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.7.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.53.mlp.router.norm.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp.router.weight": "model-00025-of-00032.safetensors", "model.layers.53.mlp_norm.weight": "model-00025-of-00032.safetensors", "model.layers.54.attn.f_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.f_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.g_norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.g_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.g_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.i_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.i_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.o_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn.o_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.attn_norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.mlp.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.mlp.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.mlp.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.54.mlp.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.54.mlp_norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.f_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.f_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.g_norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.g_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.g_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.i_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.i_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.o_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn.o_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.attn_norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.0.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.0.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.0.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.1.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.1.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.1.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.2.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.2.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.2.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.3.down_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.3.down_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.3.gate_proj.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.experts.4.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.4.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.4.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.5.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.5.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.5.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.6.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.6.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.6.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.7.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.7.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.7.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.55.mlp.router.norm.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp.router.weight": "model-00026-of-00032.safetensors", "model.layers.55.mlp_norm.weight": "model-00026-of-00032.safetensors", "model.layers.56.attn.f_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.f_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.g_norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.g_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.g_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.i_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.i_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.o_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn.o_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.attn_norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.mlp.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.mlp.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.mlp.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.56.mlp.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.56.mlp_norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.f_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.f_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.g_norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.g_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.g_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.i_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.i_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.o_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn.o_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.attn_norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.0.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.0.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.0.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.1.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.1.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.1.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.2.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.2.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.2.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.3.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.3.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.3.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.4.down_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.4.down_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.4.gate_proj.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.experts.5.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.5.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.5.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.6.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.6.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.6.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.7.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.7.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.7.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.57.mlp.router.norm.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp.router.weight": "model-00027-of-00032.safetensors", "model.layers.57.mlp_norm.weight": "model-00027-of-00032.safetensors", "model.layers.58.attn.f_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.f_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.g_norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.g_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.g_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.i_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.i_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.o_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn.o_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.attn_norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.mlp.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.mlp.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.mlp.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.58.mlp.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.58.mlp_norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.f_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.f_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.g_norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.g_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.g_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.i_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.i_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.o_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn.o_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.attn_norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.0.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.0.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.0.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.1.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.1.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.1.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.2.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.2.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.2.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.3.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.3.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.3.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.4.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.4.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.4.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.5.down_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.5.down_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.5.gate_proj.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.experts.6.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.6.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.6.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.7.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.7.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.7.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.59.mlp.router.norm.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp.router.weight": "model-00028-of-00032.safetensors", "model.layers.59.mlp_norm.weight": "model-00028-of-00032.safetensors", "model.layers.6.attn.f_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.f_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.g_norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.g_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.g_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.i_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.i_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.o_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn.o_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.attn_norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.mlp.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.mlp.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.mlp.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.6.mlp.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.6.mlp_norm.weight": "model-00004-of-00032.safetensors", "model.layers.60.attn.f_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.f_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.g_norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.g_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.g_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.i_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.i_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.o_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn.o_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.attn_norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.mlp.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.mlp.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.mlp.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.60.mlp.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.60.mlp_norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.f_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.f_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.g_norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.g_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.g_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.i_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.i_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.o_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn.o_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.attn_norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.0.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.0.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.0.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.1.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.1.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.1.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.2.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.2.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.2.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.3.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.3.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.3.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.4.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.4.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.4.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.5.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.5.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.5.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.6.down_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.6.down_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.6.gate_proj.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.experts.7.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.61.mlp.experts.7.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.61.mlp.experts.7.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.61.mlp.router.norm.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp.router.weight": "model-00029-of-00032.safetensors", "model.layers.61.mlp_norm.weight": "model-00029-of-00032.safetensors", "model.layers.62.attn.f_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.f_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.g_norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.g_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.g_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.i_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.i_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.o_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn.o_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.attn_norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.mlp.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.mlp.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.mlp.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.62.mlp.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.62.mlp_norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.f_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.f_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.g_norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.g_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.g_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.i_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.i_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.o_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn.o_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.attn_norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.0.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.0.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.0.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.1.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.1.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.1.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.2.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.2.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.2.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.3.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.3.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.3.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.3.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.4.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.4.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.4.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.5.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.5.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.5.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.6.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.6.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.6.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.7.down_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.7.down_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.7.gate_proj.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.router.norm.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp.router.weight": "model-00030-of-00032.safetensors", "model.layers.63.mlp_norm.weight": "model-00030-of-00032.safetensors", "model.layers.7.attn.f_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.f_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.g_norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.g_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.g_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.i_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.i_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.o_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn.o_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.attn_norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.0.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.0.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.0.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.1.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.1.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.1.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.2.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.2.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.2.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.3.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.3.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.3.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.4.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.4.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.4.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.5.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.5.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.5.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.6.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.6.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.6.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.7.down_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.7.down_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.7.gate_proj.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.router.norm.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp.router.weight": "model-00004-of-00032.safetensors", "model.layers.7.mlp_norm.weight": "model-00004-of-00032.safetensors", "model.layers.8.attn.f_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.f_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.g_norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.g_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.g_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.i_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.i_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.o_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn.o_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.attn_norm.weight": "model-00004-of-00032.safetensors", "model.layers.8.mlp.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.mlp.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.mlp.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.8.mlp.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.8.mlp_norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.f_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.f_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.g_norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.g_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.g_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.i_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.i_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.o_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn.o_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.attn_norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.0.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.0.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.0.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.1.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.1.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.1.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.2.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.2.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.2.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.3.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.3.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.3.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.4.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.4.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.4.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.5.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.5.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.5.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.6.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.6.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.6.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.7.down_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.7.down_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.7.gate_proj.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.router.norm.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp.router.weight": "model-00005-of-00032.safetensors", "model.layers.9.mlp_norm.weight": "model-00005-of-00032.safetensors", "model.norm.weight": "model-00030-of-00032.safetensors" } }