bartowski committed on
Commit
6bf66ff
1 Parent(s): e0e5904

Llamacpp quants

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Fimbulvetr-Kuro-Lotus-10.7B-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Fimbulvetr-Kuro-Lotus-10.7B-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Fimbulvetr-Kuro-Lotus-10.7B-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Fimbulvetr-Kuro-Lotus-10.7B-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Fimbulvetr-Kuro-Lotus-10.7B-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
Fimbulvetr-Kuro-Lotus-10.7B-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fa8511aa2404e1b28ac997e663c1bbdeb7ede89c8e61e14c14c4a9fd1a80aff
3
+ size 4003231936
Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b37ae69387e26006a78738029d604e0f0c79dc718d16f45e47097a17ff87e04
3
+ size 5650749632
Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c45ff270e7e6ca9b9fb7c76e44bd3e5e27ecec1f1ea8992aa597beae03b943a
3
+ size 5195667648
Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0296c1b228bb5f06f2746e41ad0d80b7cd59a3b20bb9bb2f0eb7759f16b3e0d5
3
+ size 4664563904
Fimbulvetr-Kuro-Lotus-10.7B-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2c9c0a0ad77c92d70ece216c2ec40219c1bf24a556128c6170175be76a2ade5
3
+ size 6072383680
Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a46ef2b032c4869b44359ac1ec0b27bdfbf857402171b570b86fc5c6680954a
3
+ size 6461667520
Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a48b970b2810bd1dc2138933d9fc1c848f0daa8bae30be4af66a8a1e1de8f678
3
+ size 6118521024
Fimbulvetr-Kuro-Lotus-10.7B-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:287a3bf5e8ef452097d33b02b5c5551723cf82c96dd7fab4e7c643e78f0b09f9
3
+ size 7397390528
Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd85cbd88e602bb0023519f37920225c3f9144c2ad91ee61a3926cb50ce0ae98
3
+ size 7597930688
Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e324596457dfac61ee6d525a830e68c6c161e5569d8bb135cfc1f14567a0b3f
3
+ size 7397390528
Fimbulvetr-Kuro-Lotus-10.7B-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d1d4e78b63b46f36f2850af08a85f89684952c87b044310eea52780df1b6ab9
3
+ size 8805210304
Fimbulvetr-Kuro-Lotus-10.7B-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:852aa0557bb9cde0625f37568145b75d409cce7432e3d6debea0b03e2d1b27bd
3
+ size 11404155072
README.md ADDED
@@ -0,0 +1,140 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: cc-by-nc-4.0
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+ base_model:
8
+ - Sao10K/Fimbulvetr-10.7B-v1
9
+ - saishf/Kuro-Lotus-10.7B
10
+ model-index:
11
+ - name: Fimbulvetr-Kuro-Lotus-10.7B
12
+ results:
13
+ - task:
14
+ type: text-generation
15
+ name: Text Generation
16
+ dataset:
17
+ name: AI2 Reasoning Challenge (25-Shot)
18
+ type: ai2_arc
19
+ config: ARC-Challenge
20
+ split: test
21
+ args:
22
+ num_few_shot: 25
23
+ metrics:
24
+ - type: acc_norm
25
+ value: 69.54
26
+ name: normalized accuracy
27
+ source:
28
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
29
+ name: Open LLM Leaderboard
30
+ - task:
31
+ type: text-generation
32
+ name: Text Generation
33
+ dataset:
34
+ name: HellaSwag (10-Shot)
35
+ type: hellaswag
36
+ split: validation
37
+ args:
38
+ num_few_shot: 10
39
+ metrics:
40
+ - type: acc_norm
41
+ value: 87.87
42
+ name: normalized accuracy
43
+ source:
44
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
45
+ name: Open LLM Leaderboard
46
+ - task:
47
+ type: text-generation
48
+ name: Text Generation
49
+ dataset:
50
+ name: MMLU (5-Shot)
51
+ type: cais/mmlu
52
+ config: all
53
+ split: test
54
+ args:
55
+ num_few_shot: 5
56
+ metrics:
57
+ - type: acc
58
+ value: 66.99
59
+ name: accuracy
60
+ source:
61
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
62
+ name: Open LLM Leaderboard
63
+ - task:
64
+ type: text-generation
65
+ name: Text Generation
66
+ dataset:
67
+ name: TruthfulQA (0-shot)
68
+ type: truthful_qa
69
+ config: multiple_choice
70
+ split: validation
71
+ args:
72
+ num_few_shot: 0
73
+ metrics:
74
+ - type: mc2
75
+ value: 60.95
76
+ source:
77
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
78
+ name: Open LLM Leaderboard
79
+ - task:
80
+ type: text-generation
81
+ name: Text Generation
82
+ dataset:
83
+ name: Winogrande (5-shot)
84
+ type: winogrande
85
+ config: winogrande_xl
86
+ split: validation
87
+ args:
88
+ num_few_shot: 5
89
+ metrics:
90
+ - type: acc
91
+ value: 84.14
92
+ name: accuracy
93
+ source:
94
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
95
+ name: Open LLM Leaderboard
96
+ - task:
97
+ type: text-generation
98
+ name: Text Generation
99
+ dataset:
100
+ name: GSM8k (5-shot)
101
+ type: gsm8k
102
+ config: main
103
+ split: test
104
+ args:
105
+ num_few_shot: 5
106
+ metrics:
107
+ - type: acc
108
+ value: 66.87
109
+ name: accuracy
110
+ source:
111
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=saishf/Fimbulvetr-Kuro-Lotus-10.7B
112
+ name: Open LLM Leaderboard
113
+ quantized_by: bartowski
114
+ pipeline_tag: text-generation
115
+ ---
116
+
117
+ ## Llamacpp Quantizations of Fimbulvetr-Kuro-Lotus-10.7B
118
+
119
+ Using <a href="https://github.com/ggerganov/llama.cpp/">llama.cpp</a> release <a href="https://github.com/ggerganov/llama.cpp/releases/tag/b2440">b2440</a> for quantization.
120
+
121
+ Original model: https://huggingface.co/saishf/Fimbulvetr-Kuro-Lotus-10.7B
122
+
123
+ Download a single file (not the whole branch) from the table below:
124
+
125
+ | Filename | Quant type | File Size | Description |
126
+ | -------- | ---------- | --------- | ----------- |
127
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q8_0.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q8_0.gguf) | Q8_0 | 11.40GB | Extremely high quality, generally unneeded but max available quant. |
128
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q6_K.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q6_K.gguf) | Q6_K | 8.80GB | Very high quality, near perfect, *recommended*. |
129
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_M.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_M.gguf) | Q5_K_M | 7.59GB | High quality, very usable. |
130
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_S.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q5_K_S.gguf) | Q5_K_S | 7.39GB | High quality, very usable. |
131
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q5_0.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q5_0.gguf) | Q5_0 | 7.39GB | High quality, older format, generally not recommended. |
132
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_M.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_M.gguf) | Q4_K_M | 6.46GB | Good quality, similar to 4.25 bpw. |
133
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_S.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q4_K_S.gguf) | Q4_K_S | 6.11GB | Slightly lower quality with small space savings. |
134
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q4_0.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q4_0.gguf) | Q4_0 | 6.07GB | Decent quality, older format, generally not recommended. |
135
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_L.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_L.gguf) | Q3_K_L | 5.65GB | Lower quality but usable, good for low RAM availability. |
136
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_M.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_M.gguf) | Q3_K_M | 5.19GB | Even lower quality. |
137
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_S.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q3_K_S.gguf) | Q3_K_S | 4.66GB | Low quality, not recommended. |
138
+ | [Fimbulvetr-Kuro-Lotus-10.7B-Q2_K.gguf](https://huggingface.co/bartowski/Fimbulvetr-Kuro-Lotus-10.7B-GGUF/blob/main/Fimbulvetr-Kuro-Lotus-10.7B-Q2_K.gguf) | Q2_K | 4.00GB | Extremely low quality, *not* recommended. |
139
+
140
+ Want to support my work? Visit my ko-fi page here: https://ko-fi.com/bartowski