nisten committed on
Commit
6c5e613
1 Parent(s): 0e76852

Very good quant for the speed/perplexity trade-off; the embedding is at q4k

Browse files
.gitattributes CHANGED
@@ -49,3 +49,4 @@ qwen7bq4xsoutput6k.gguf filter=lfs diff=lfs merge=lfs -text
49
  qwenv2instruct7b_q8.gguf filter=lfs diff=lfs merge=lfs -text
50
  qwen7bv2instruct_q5km.gguf filter=lfs diff=lfs merge=lfs -text
51
  qwen7bv2_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
 
 
49
  qwenv2instruct7b_q8.gguf filter=lfs diff=lfs merge=lfs -text
50
  qwen7bv2instruct_q5km.gguf filter=lfs diff=lfs merge=lfs -text
51
  qwen7bv2_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
52
+ qwen7bv2inst_q4km_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
qwen7bq4koutput8bit.gguf → qwen7bv2inst_q4km_output8bit.gguf RENAMED
File without changes