TheBloke
/

Mixtral-8x7B-v0.1-GPTQ

Text Generation

text-generation-inference

4-bit precision

Model card Files Files and versions Community

TheBloke committed on Dec 12, 2023

Commit

8de41f5

•

1 Parent(s): e0ca44b

Update config.json

Files changed (1) hide show

config.json +1 -1

config.json CHANGED Viewed

@@ -31,7 +31,7 @@
     "vocab_size": 32000,
     "quantization_config": {
         "bits": 4,
-	"inside_layer_modules" : [
         ["self_attn.k_proj", "self_attn.v_proj", "self_attn.q_proj"],
         ["self_attn.o_proj"],
         ["block_sparse_moe.experts.0.w1", "block_sparse_moe.experts.0.w2", "block_sparse_moe.experts.0.w3"],

     "vocab_size": 32000,
     "quantization_config": {
         "bits": 4,
+		"modules_in_block_to_quantize" : [
         ["self_attn.k_proj", "self_attn.v_proj", "self_attn.q_proj"],
         ["self_attn.o_proj"],
         ["block_sparse_moe.experts.0.w1", "block_sparse_moe.experts.0.w2", "block_sparse_moe.experts.0.w3"],