dqnguyen committed on
Commit
c76e717
1 Parent(s): 74ba0c7

Upload model PhoGPT-4B-Chat.gguf converted to gguf FP16 format and its quantized variants

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.gguf filter=lfs diff=lfs merge=lfs -text
PhoGPT-4B-Chat-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e570e9ae19e5792d01b3c68cf47056ebf37eb0202337bb580959a02f52a0a23
3
+ size 2364868288
PhoGPT-4B-Chat-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cb933f5a60113cfb26fcf5a6c147bf5895d4010f23c3e3aa392a24ddaff657a
3
+ size 3923084992
PhoGPT-4B-Chat.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f224e813bb7476b1da4f3c6f9dab38cac6944fe6a6f9462794467b1efed2506c
3
+ size 7379453568