medmekk HF staff committed on 11 days ago

Commit

52fc2aa

verified ·

1 Parent(s): 5f6cb1b

Upload quantized models

Browse files

Files changed (22) hide show

.gitattributes +20 -0
Llama-3.2-1B-Instruct-IQ3_M_imat.gguf +3 -0
Llama-3.2-1B-Instruct-IQ3_XXS_imat.gguf +3 -0
Llama-3.2-1B-Instruct-IQ4_NL_imat.gguf +3 -0
Llama-3.2-1B-Instruct-IQ4_XS_imat.gguf +3 -0
Llama-3.2-1B-Instruct-Q2_K.gguf +3 -0
Llama-3.2-1B-Instruct-Q3_K_L.gguf +3 -0
Llama-3.2-1B-Instruct-Q3_K_M.gguf +3 -0
Llama-3.2-1B-Instruct-Q3_K_S.gguf +3 -0
Llama-3.2-1B-Instruct-Q4_0.gguf +3 -0
Llama-3.2-1B-Instruct-Q4_K_M.gguf +3 -0
Llama-3.2-1B-Instruct-Q4_K_M_imat.gguf +3 -0
Llama-3.2-1B-Instruct-Q4_K_S.gguf +3 -0
Llama-3.2-1B-Instruct-Q4_K_S_imat.gguf +3 -0
Llama-3.2-1B-Instruct-Q5_0.gguf +3 -0
Llama-3.2-1B-Instruct-Q5_K_M.gguf +3 -0
Llama-3.2-1B-Instruct-Q5_K_M_imat.gguf +3 -0
Llama-3.2-1B-Instruct-Q5_K_S.gguf +3 -0
Llama-3.2-1B-Instruct-Q5_K_S_imat.gguf +3 -0
Llama-3.2-1B-Instruct-Q6_K.gguf +3 -0
Llama-3.2-1B-Instruct-Q8_0.gguf +3 -0
README.md +34 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-IQ3_M_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-IQ3_XXS_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q4_K_M_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q4_K_S_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-IQ4_NL_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-IQ4_XS_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q5_K_M_imat.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-3.2-1B-Instruct-Q5_K_S_imat.gguf filter=lfs diff=lfs merge=lfs -text

Llama-3.2-1B-Instruct-IQ3_M_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:848b4fb777c026a2eae3e1033734d620b2772982ea9dc905ee8f8bcf594a407b
+size 657289280

Llama-3.2-1B-Instruct-IQ3_XXS_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7216551ff66ca41612412f62ab8db58abac017933ed9934d12345a3eeedc9950
+size 562110528

Llama-3.2-1B-Instruct-IQ4_NL_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2eda584fdcb4067620b9b11079a154f11cad9c734ff77011b945d1effa8c259c
+size 773025856

Llama-3.2-1B-Instruct-IQ4_XS_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15f8c3ec48edf71a67b6096336fee7b77221421022aae1aa21b39616ea227531
+size 743141440

Llama-3.2-1B-Instruct-Q2_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a870730e0fff8e6c4656e4f611faa16bde7b16f33c059292167a174bf15e5b2e
+size 580874080

Llama-3.2-1B-Instruct-Q3_K_L.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef44bca078435843c7788f9c03e7b495a099c131f845ed19dc0257e561e8caf3
+size 732524384

Llama-3.2-1B-Instruct-Q3_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b36f7efe910829de87ab1fcd9a55fdb0bf481d8e158345b13dc48486a324a79
+size 690843488

Llama-3.2-1B-Instruct-Q3_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1444f1e3d528823058010ea5152b8f32a332f9bce37290d480c4d4e50b04eb41
+size 641691488

Llama-3.2-1B-Instruct-Q4_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eadfd8fd4e29d48e720eb87fc8242d3a8d4d2dacd52c722adc8e69e48c668efc
+size 770928480

Llama-3.2-1B-Instruct-Q4_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26bac8efd811cb41a80db4393dbe5c8360abd54b98954ec766aa4ba7dacc0bc5
+size 807694176

Llama-3.2-1B-Instruct-Q4_K_M_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9a93ed1c1df05b83a365b2a1ca429657df063e642fde9027e54cbf07137d5e9
+size 807694400

Llama-3.2-1B-Instruct-Q4_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5550376826ef08901a4145559647844d5e70a950d69145e83ae2d262ce5ce0e2
+size 775647072

Llama-3.2-1B-Instruct-Q4_K_S_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdac3f90911b2c9e171af128787e7ce6a769fb2a64a90f5b2597db97ac1623b6
+size 775647296

Llama-3.2-1B-Instruct-Q5_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6aea9bca54d1b5033035771963e0bf24d307ff756ab476744a2b43ad2eeb68d
+size 892563296

Llama-3.2-1B-Instruct-Q5_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f5165ccccbd6953de2a35ca56300ebedfb70739a407dd096e3a5c658477aefa
+size 911503200

Llama-3.2-1B-Instruct-Q5_K_M_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ea756771308d485601da96d5ce6f62745888ea84fbc8d4b6bb0f3b214816a83b
+size 911503424

Llama-3.2-1B-Instruct-Q5_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a14d69cc881f282405b8ba59ab6377a3eb7f2c3686077d1be796c87f6298c398
+size 892563296

Llama-3.2-1B-Instruct-Q5_K_S_imat.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:852c37accb67fad10d2ae9ab8e36338b5365dbf43b039672534a4768f1c8905b
+size 892563520

Llama-3.2-1B-Instruct-Q6_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4bf385159856b7c50a938b1228112318d9f99238a76880ea0f6381ab879982b3
+size 1021800288

Llama-3.2-1B-Instruct-Q8_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da49f51ced8c15546e7779beb677fb53eb5d0b3b38ac4607ac60d58d77074823
+size 1321082720

README.md ADDED Viewed

	@@ -0,0 +1,34 @@

+# medmekk/Llama-3.2-1B-Instruct.GGUF
+GGUF quantized versions of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct)
+## Available Formats:
+- `Q2_K`: Llama-3.2-1B-Instruct-Q2_K.gguf
+- `Q3_K_S`: Llama-3.2-1B-Instruct-Q3_K_S.gguf
+- `Q3_K_M`: Llama-3.2-1B-Instruct-Q3_K_M.gguf
+- `Q3_K_L`: Llama-3.2-1B-Instruct-Q3_K_L.gguf
+- `Q4_0`: Llama-3.2-1B-Instruct-Q4_0.gguf
+- `Q4_K_S`: Llama-3.2-1B-Instruct-Q4_K_S.gguf
+- `Q4_K_M`: Llama-3.2-1B-Instruct-Q4_K_M.gguf
+- `Q5_0`: Llama-3.2-1B-Instruct-Q5_0.gguf
+- `Q5_K_S`: Llama-3.2-1B-Instruct-Q5_K_S.gguf
+- `Q5_K_M`: Llama-3.2-1B-Instruct-Q5_K_M.gguf
+- `Q6_K`: Llama-3.2-1B-Instruct-Q6_K.gguf
+- `Q8_0`: Llama-3.2-1B-Instruct-Q8_0.gguf
+- `IQ3_M_IMAT`: Llama-3.2-1B-Instruct-IQ3_M_imat.gguf
+- `IQ3_XXS_IMAT`: Llama-3.2-1B-Instruct-IQ3_XXS_imat.gguf
+- `Q4_K_M_IMAT`: Llama-3.2-1B-Instruct-Q4_K_M_imat.gguf
+- `Q4_K_S_IMAT`: Llama-3.2-1B-Instruct-Q4_K_S_imat.gguf
+- `IQ4_NL_IMAT`: Llama-3.2-1B-Instruct-IQ4_NL_imat.gguf
+- `IQ4_XS_IMAT`: Llama-3.2-1B-Instruct-IQ4_XS_imat.gguf
+- `Q5_K_M_IMAT`: Llama-3.2-1B-Instruct-Q5_K_M_imat.gguf
+- `Q5_K_S_IMAT`: Llama-3.2-1B-Instruct-Q5_K_S_imat.gguf
+## Usage with llama.cpp:
+```bash
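+# CLI (replace MODEL_FILE with one of the .gguf filenames listed above, e.g. Llama-3.2-1B-Instruct-Q4_K_M.gguf):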
+llama-cli --hf-repo medmekk/Llama-3.2-1B-Instruct.GGUF --hf-file MODEL_FILE -p "Your prompt"
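+# Server (replace MODEL_FILE with one of the .gguf filenames listed above; -c sets the context size in tokens):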
+llama-server --hf-repo medmekk/Llama-3.2-1B-Instruct.GGUF --hf-file MODEL_FILE -c 2048
+```