diff --git "a/model.safetensors.index.json" "b/model.safetensors.index.json" --- "a/model.safetensors.index.json" +++ "b/model.safetensors.index.json" @@ -1,6 +1,6 @@ { "metadata": { - "total_size": 5424345194 + "total_size": 5724548352 }, "weight_map": { "model.embed_tokens.weight": "model-00001-of-00002.safetensors", @@ -9,15 +9,11 @@ "model.layers.0.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.0.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.0.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.0.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.0.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -25,29 +21,21 @@ "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.0.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.0.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.0.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -55,15 +43,11 @@ "model.layers.1.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.1.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.1.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.1.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.1.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -71,29 +55,21 @@ "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.1.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.1.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.1.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -101,15 +77,11 @@ "model.layers.10.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.10.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.10.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.10.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.10.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -117,29 +89,21 @@ "model.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.10.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.10.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.10.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -147,15 +111,11 @@ "model.layers.11.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.11.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.11.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.11.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.11.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -163,29 +123,21 @@ "model.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.11.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.11.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.11.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -193,15 +145,11 @@ "model.layers.12.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.12.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.12.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.12.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.12.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -209,29 +157,21 @@ "model.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.12.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.12.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.12.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -239,15 +179,11 @@ "model.layers.13.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.13.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.13.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.13.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.13.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -255,29 +191,21 @@ "model.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.13.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.13.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.13.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -285,15 +213,11 @@ "model.layers.14.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.14.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.14.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.14.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.14.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -301,29 +225,21 @@ "model.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.14.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.14.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.14.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -331,15 +247,11 @@ "model.layers.15.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.15.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.15.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.15.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.15.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -347,29 +259,21 @@ "model.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.15.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.15.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.15.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -377,15 +281,11 @@ "model.layers.16.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.16.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.16.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.16.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.16.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -393,29 +293,21 @@ "model.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.16.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.16.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.16.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -423,15 +315,11 @@ "model.layers.17.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.17.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.17.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.17.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.17.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -439,29 +327,21 @@ "model.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.17.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.17.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.17.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -469,15 +349,11 @@ "model.layers.18.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.18.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.18.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.18.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.18.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -485,29 +361,21 @@ "model.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.18.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.18.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.18.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -515,15 +383,11 @@ "model.layers.19.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.19.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.19.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.19.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.19.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -531,29 +395,21 @@ "model.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.19.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.19.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.19.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -561,15 +417,11 @@ "model.layers.2.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.2.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.2.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.2.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.2.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -577,29 +429,21 @@ "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.2.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.2.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.2.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -607,15 +451,11 @@ "model.layers.20.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.20.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.20.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.20.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.20.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -623,29 +463,21 @@ "model.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.20.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.20.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.20.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -653,15 +485,11 @@ "model.layers.21.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.21.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.21.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.21.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.21.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -669,29 +497,21 @@ "model.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.21.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.21.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.21.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -699,15 +519,11 @@ "model.layers.22.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.22.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.22.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.22.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.22.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -715,29 +531,21 @@ "model.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.22.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.22.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.22.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -745,15 +553,11 @@ "model.layers.23.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.23.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.23.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.23.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.23.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -761,29 +565,21 @@ "model.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.23.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.23.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.23.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -791,15 +587,11 @@ "model.layers.24.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.24.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.24.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.24.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.24.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -807,183 +599,135 @@ "model.layers.24.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.24.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.24.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.24.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", "model.layers.24.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.bias": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.25.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.bias": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.25.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.25.final_layer_norm.bias": "model-00001-of-00002.safetensors", - "model.layers.25.final_layer_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.25.fc1.bias": "model-00002-of-00002.safetensors", + "model.layers.25.fc1.weight": "model-00002-of-00002.safetensors", + "model.layers.25.fc1.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.25.fc1.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.25.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.25.fc2.bias": "model-00002-of-00002.safetensors", + "model.layers.25.fc2.weight": "model-00002-of-00002.safetensors", + "model.layers.25.fc2.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.25.fc2.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.25.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.25.final_layer_norm.bias": "model-00002-of-00002.safetensors", + "model.layers.25.final_layer_norm.weight": "model-00002-of-00002.safetensors", "model.layers.25.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.25.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.25.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.25.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", "model.layers.25.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.bias": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.bias": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.final_layer_norm.bias": "model-00001-of-00002.safetensors", - "model.layers.26.final_layer_norm.weight": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", - "model.layers.26.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.bias": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", + "model.layers.26.fc1.bias": "model-00002-of-00002.safetensors", + "model.layers.26.fc1.weight": "model-00002-of-00002.safetensors", + "model.layers.26.fc1.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.fc1.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.fc2.bias": "model-00002-of-00002.safetensors", + "model.layers.26.fc2.weight": "model-00002-of-00002.safetensors", + "model.layers.26.fc2.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.fc2.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.final_layer_norm.bias": "model-00002-of-00002.safetensors", + "model.layers.26.final_layer_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.fc1.bias": "model-00002-of-00002.safetensors", + "model.layers.27.fc1.weight": "model-00002-of-00002.safetensors", + "model.layers.27.fc1.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.27.fc1.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.27.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.27.fc2.bias": "model-00002-of-00002.safetensors", "model.layers.27.fc2.weight": "model-00002-of-00002.safetensors", "model.layers.27.fc2.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.27.fc2.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.27.fc2.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.27.fc2.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.27.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.27.final_layer_norm.bias": "model-00002-of-00002.safetensors", "model.layers.27.final_layer_norm.weight": "model-00002-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", - "model.layers.27.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors", "model.layers.28.fc1.bias": "model-00002-of-00002.safetensors", "model.layers.28.fc1.weight": "model-00002-of-00002.safetensors", "model.layers.28.fc1.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.fc1.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.fc1.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.fc1.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.fc2.bias": "model-00002-of-00002.safetensors", "model.layers.28.fc2.weight": "model-00002-of-00002.safetensors", "model.layers.28.fc2.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.fc2.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.fc2.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.fc2.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.final_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -991,29 +735,21 @@ "model.layers.28.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.out_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.out_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.28.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.28.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.28.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1021,15 +757,11 @@ "model.layers.29.fc1.bias": "model-00002-of-00002.safetensors", "model.layers.29.fc1.weight": "model-00002-of-00002.safetensors", "model.layers.29.fc1.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.fc1.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.fc1.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.fc1.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.fc2.bias": "model-00002-of-00002.safetensors", "model.layers.29.fc2.weight": "model-00002-of-00002.safetensors", "model.layers.29.fc2.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.fc2.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.fc2.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.fc2.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.final_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1037,29 +769,21 @@ "model.layers.29.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.out_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.out_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.29.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.29.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.29.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1067,15 +791,11 @@ "model.layers.3.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.3.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.3.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.3.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.3.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1083,29 +803,21 @@ "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.3.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.3.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.3.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1113,15 +825,11 @@ "model.layers.30.fc1.bias": "model-00002-of-00002.safetensors", "model.layers.30.fc1.weight": "model-00002-of-00002.safetensors", "model.layers.30.fc1.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.fc1.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.fc1.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.fc1.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.fc2.bias": "model-00002-of-00002.safetensors", "model.layers.30.fc2.weight": "model-00002-of-00002.safetensors", "model.layers.30.fc2.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.fc2.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.fc2.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.fc2.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.final_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1129,29 +837,21 @@ "model.layers.30.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.out_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.out_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.30.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.30.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.30.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1159,15 +859,11 @@ "model.layers.31.fc1.bias": "model-00002-of-00002.safetensors", "model.layers.31.fc1.weight": "model-00002-of-00002.safetensors", "model.layers.31.fc1.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.fc1.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.fc1.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.fc1.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.fc1.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.fc2.bias": "model-00002-of-00002.safetensors", "model.layers.31.fc2.weight": "model-00002-of-00002.safetensors", "model.layers.31.fc2.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.fc2.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.fc2.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.fc2.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.fc2.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.final_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1175,29 +871,21 @@ "model.layers.31.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.k_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.k_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.out_proj.bias": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.out_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.out_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.out_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.out_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.out_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.q_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.q_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.v_proj.weight.absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00002.safetensors", - "model.layers.31.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.v_proj.weight.quant_map": "model-00002-of-00002.safetensors", "model.layers.31.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00002-of-00002.safetensors", "model.layers.31.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors", @@ -1205,15 +893,11 @@ "model.layers.4.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.4.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.4.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.4.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.4.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1221,29 +905,21 @@ "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.4.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.4.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.4.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1251,15 +927,11 @@ "model.layers.5.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.5.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.5.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.5.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.5.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1267,29 +939,21 @@ "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.5.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.5.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.5.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1297,15 +961,11 @@ "model.layers.6.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.6.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.6.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.6.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.6.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1313,29 +973,21 @@ "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.6.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.6.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.6.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1343,15 +995,11 @@ "model.layers.7.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.7.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.7.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.7.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.7.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1359,29 +1007,21 @@ "model.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.7.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.7.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.7.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1389,15 +1029,11 @@ "model.layers.8.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.8.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.8.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.8.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.8.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1405,29 +1041,21 @@ "model.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.8.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.8.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.8.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1435,15 +1063,11 @@ "model.layers.9.fc1.bias": "model-00001-of-00002.safetensors", "model.layers.9.fc1.weight": "model-00001-of-00002.safetensors", "model.layers.9.fc1.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.fc1.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.fc1.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.fc1.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.fc1.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.fc2.bias": "model-00001-of-00002.safetensors", "model.layers.9.fc2.weight": "model-00001-of-00002.safetensors", "model.layers.9.fc2.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.fc2.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.fc2.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.fc2.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.fc2.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.final_layer_norm.bias": "model-00001-of-00002.safetensors", @@ -1451,29 +1075,21 @@ "model.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.k_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.k_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.k_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.out_proj.bias": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.out_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.out_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.out_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.out_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.out_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.out_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.q_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.q_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.q_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.v_proj.weight.absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00002.safetensors", - "model.layers.9.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.v_proj.weight.quant_map": "model-00001-of-00002.safetensors", "model.layers.9.self_attn.v_proj.weight.quant_state.bitsandbytes__fp4": "model-00001-of-00002.safetensors", "model.layers.9.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",