Good speed reference quant for older CPUs; however, there is not much improvement from the f16 embedding.
Browse files
.gitattributes
CHANGED
@@ -55,3 +55,4 @@ qwen7bv2inst_iq4xs_embedding8_output8.gguf filter=lfs diff=lfs merge=lfs -text
|
|
55 |
qwen7bv2inst_iq4xs_embedding8_outputq8.gguf filter=lfs diff=lfs merge=lfs -text
|
56 |
qwen7bv2inst_Iq4xs_output6k.gguf filter=lfs diff=lfs merge=lfs -text
|
57 |
qwen7bv2instruct_q8.gguf filter=lfs diff=lfs merge=lfs -text
|
|
|
|
55 |
qwen7bv2inst_iq4xs_embedding8_outputq8.gguf filter=lfs diff=lfs merge=lfs -text
|
56 |
qwen7bv2inst_Iq4xs_output6k.gguf filter=lfs diff=lfs merge=lfs -text
|
57 |
qwen7bv2instruct_q8.gguf filter=lfs diff=lfs merge=lfs -text
|
58 |
+
qwen7bv2inst_q4km_embeddingf16_outputf16.gguf filter=lfs diff=lfs merge=lfs -text
|
qwen7bq4kembeddingf16outputf16.gguf → qwen7bv2inst_q4km_embeddingf16_outputf16.gguf
RENAMED
File without changes
|