very good quant for speed/perplexity, embedding is at q4k
Browse files
.gitattributes
CHANGED
@@ -49,3 +49,4 @@ qwen7bq4xsoutput6k.gguf filter=lfs diff=lfs merge=lfs -text
|
|
49 |
qwenv2instruct7b_q8.gguf filter=lfs diff=lfs merge=lfs -text
|
50 |
qwen7bv2instruct_q5km.gguf filter=lfs diff=lfs merge=lfs -text
|
51 |
qwen7bv2_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
|
|
|
|
49 |
qwenv2instruct7b_q8.gguf filter=lfs diff=lfs merge=lfs -text
|
50 |
qwen7bv2instruct_q5km.gguf filter=lfs diff=lfs merge=lfs -text
|
51 |
qwen7bv2_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
|
52 |
+
qwen7bv2inst_q4km_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
|
qwen7bq4koutput8bit.gguf → qwen7bv2inst_q4km_output8bit.gguf
RENAMED
File without changes
|