Venkatesh Srinivas committed on
Commit
fe8946f
1 Parent(s): dde70a8

Import imatrix source/data and IQ3_XXS (3.06 bpw) quant for 8GB GPUs

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ imatrix.dat filter=lfs diff=lfs merge=lfs -text
group_10_merged.txt ADDED
The diff for this file is too large to render. See raw diff
 
imatrix.dat ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4b95e85c3ba8cea4e7619f8b92f23422c095b62858f71567954ba5c4297e1b1
3
+ size 11061292
psyonic_sydney-20b.gguf.iq3_xxs.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64d0dd81bd794986f80f120b7619576237ec56c1bb349de91d6d73495ca946f4
3
+ size 7587788320