GGUF
Inference Endpoints
sakuraumi committed on
Commit
d3a6154
1 Parent(s): 599c317

Upload GGUF models.

Browse files
.gitattributes CHANGED
@@ -39,3 +39,4 @@ sakura-7b-lnovel-v0.9-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
  sakura-7b-lnovel-v0.9-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
40
  sakura-7b-lnovel-v0.9-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
41
  sakura-7b-lnovel-v0.9-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
 
 
39
  sakura-7b-lnovel-v0.9-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
40
  sakura-7b-lnovel-v0.9-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
41
  sakura-7b-lnovel-v0.9-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
42
+ sakura-7b-lnovel-v0.9-fp16.gguf filter=lfs diff=lfs merge=lfs -text
sakura-7b-lnovel-v0.9-fp16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c481cb4dd617287f6ada1f6b697cf2d7c38b172017af93681bf0905dd4fbea2b
3
+ size 15449914656