nisten committed on
Commit
9869461
1 Parent(s): 51abeba

best speed/perplexity for mobile devices with int8 acceleration

Browse files
.gitattributes CHANGED
@@ -59,3 +59,4 @@ qwen7bv2inst_q4km_embeddingf16_outputf16.gguf filter=lfs diff=lfs merge=lfs -tex
59
  qwen7bv2inst_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
60
  qwen7bv2inst_q4km_embedding4k_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
61
  qwen7bv2inst_iq4xs_embedding4xs_output6k.gguf filter=lfs diff=lfs merge=lfs -text
 
 
59
  qwen7bv2inst_iq4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
60
  qwen7bv2inst_q4km_embedding4k_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
61
  qwen7bv2inst_iq4xs_embedding4xs_output6k.gguf filter=lfs diff=lfs merge=lfs -text
62
+ qwen7bv2inst_iq4xs_embedding4xs_output8bit.gguf filter=lfs diff=lfs merge=lfs -text
qwen7bv2inst_iq4xs_output8bit.gguf → qwen7bv2inst_iq4xs_embedding4xs_output8bit.gguf RENAMED
File without changes