morriszms committed on
Commit
effec43
1 Parent(s): 657792f

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Pythia-31M-Chat-v1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Pythia-31M-Chat-v1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Pythia-31M-Chat-v1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Pythia-31M-Chat-v1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Pythia-31M-Chat-v1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Pythia-31M-Chat-v1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Pythia-31M-Chat-v1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Pythia-31M-Chat-v1-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Pythia-31M-Chat-v1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Pythia-31M-Chat-v1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Pythia-31M-Chat-v1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Pythia-31M-Chat-v1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
Pythia-31M-Chat-v1-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b787655ad514ded6933752c4cc2c1889b49118d748fd78499d66bedf093d0f
3
+ size 18393408
Pythia-31M-Chat-v1-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff2e3f531a18d2a204a04df95165e0d95504bf2147fb9c0627a694762d63195
3
+ size 20644416
Pythia-31M-Chat-v1-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951740af7699141cd10f18bbc1896215f975de334db4d8487c007b1bbcef41f8
3
+ size 20398656
Pythia-31M-Chat-v1-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:338e61bedfa70a71cc36aebd97a1846103452ca4deb61e71f8c349eadcd8eb35
3
+ size 19980864
Pythia-31M-Chat-v1-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154ec3af278abb7e091bbe11f3a7f1ee35372545e49b82d766e5055aef6ef5f0
3
+ size 22317888
Pythia-31M-Chat-v1-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7afeb12b87f63148dd4b471d03bd3e494d9357888c51a094e1c20688e88b756e
3
+ size 22600512
Pythia-31M-Chat-v1-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:084fadb72662eefa6d9a927280a995472663d2a4ca106ea8bc383c4f66f7e0e3
3
+ size 22317888
Pythia-31M-Chat-v1-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c287801de561986ea87d73f07ee4c6b49bea905c8ef30e18e1695177a31c6b9
3
+ size 24517440
Pythia-31M-Chat-v1-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79af5d786685dafdafe43e89c146c94e63c73da1a96f2664e12a9bb55993d7bc
3
+ size 24743744
Pythia-31M-Chat-v1-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d5fea3be949e9edc005b194df2b84c94296975081f7878c1e4b14d737d67e8d
3
+ size 24517440
Pythia-31M-Chat-v1-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:799d4582a70731364983022296b1004c46f710b08aabe9d689624ea75812a14d
3
+ size 26854464
Pythia-31M-Chat-v1-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cd105677585ebcaf4e2bdb13d9982b701df619e27969012a7ba17905b8db478
3
+ size 34234944
README.md ADDED
@@ -0,0 +1,229 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: apache-2.0
5
+ base_model: Felladrin/Pythia-31M-Chat-v1
6
+ datasets:
7
+ - totally-not-an-llm/EverythingLM-data-V3
8
+ - databricks/databricks-dolly-15k
9
+ - THUDM/webglm-qa
10
+ - starfishmedical/webGPT_x_dolly
11
+ - Amod/mental_health_counseling_conversations
12
+ - sablo/oasst2_curated
13
+ - cognitivecomputations/wizard_vicuna_70k_unfiltered
14
+ - mlabonne/chatml_dpo_pairs
15
+ pipeline_tag: text-generation
16
+ widget:
17
+ - messages:
18
+ - role: system
19
+ content: You are a career counselor. The user will provide you with an individual
20
+ looking for guidance in their professional life, and your task is to assist
21
+ them in determining what careers they are most suited for based on their skills,
22
+ interests, and experience. You should also conduct research into the various
23
+ options available, explain the job market trends in different industries, and
24
+ advise on which qualifications would be beneficial for pursuing particular fields.
25
+ - role: user
26
+ content: Heya!
27
+ - role: assistant
28
+ content: Hi! How may I help you?
29
+ - role: user
30
+ content: I am interested in developing a career in software engineering. What
31
+ would you recommend me to do?
32
+ - messages:
33
+ - role: system
34
+ content: You are a helpful assistant who answers user's questions with details
35
+ and curiosity.
36
+ - role: user
37
+ content: What are some potential applications for quantum computing?
38
+ - messages:
39
+ - role: system
40
+ content: You are a highly knowledgeable assistant. Help the user as much as you
41
+ can.
42
+ - role: user
43
+ content: What are some steps I can take to become a healthier person?
44
+ inference:
45
+ parameters:
46
+ max_new_tokens: 250
47
+ penalty_alpha: 0.5
48
+ top_k: 2
49
+ repetition_penalty: 1.0016
50
+ tags:
51
+ - TensorBlock
52
+ - GGUF
53
+ model-index:
54
+ - name: Pythia-31M-Chat-v1
55
+ results:
56
+ - task:
57
+ type: text-generation
58
+ name: Text Generation
59
+ dataset:
60
+ name: AI2 Reasoning Challenge (25-Shot)
61
+ type: ai2_arc
62
+ config: ARC-Challenge
63
+ split: test
64
+ args:
65
+ num_few_shot: 25
66
+ metrics:
67
+ - type: acc_norm
68
+ value: 22.7
69
+ name: normalized accuracy
70
+ source:
71
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
72
+ name: Open LLM Leaderboard
73
+ - task:
74
+ type: text-generation
75
+ name: Text Generation
76
+ dataset:
77
+ name: HellaSwag (10-Shot)
78
+ type: hellaswag
79
+ split: validation
80
+ args:
81
+ num_few_shot: 10
82
+ metrics:
83
+ - type: acc_norm
84
+ value: 25.6
85
+ name: normalized accuracy
86
+ source:
87
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
88
+ name: Open LLM Leaderboard
89
+ - task:
90
+ type: text-generation
91
+ name: Text Generation
92
+ dataset:
93
+ name: MMLU (5-Shot)
94
+ type: cais/mmlu
95
+ config: all
96
+ split: test
97
+ args:
98
+ num_few_shot: 5
99
+ metrics:
100
+ - type: acc
101
+ value: 23.24
102
+ name: accuracy
103
+ source:
104
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
105
+ name: Open LLM Leaderboard
106
+ - task:
107
+ type: text-generation
108
+ name: Text Generation
109
+ dataset:
110
+ name: Winogrande (5-shot)
111
+ type: winogrande
112
+ config: winogrande_xl
113
+ split: validation
114
+ args:
115
+ num_few_shot: 5
116
+ metrics:
117
+ - type: acc
118
+ value: 47.99
119
+ name: accuracy
120
+ source:
121
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
122
+ name: Open LLM Leaderboard
123
+ - task:
124
+ type: text-generation
125
+ name: Text Generation
126
+ dataset:
127
+ name: TruthfulQA (0-shot)
128
+ type: truthful_qa
129
+ config: multiple_choice
130
+ split: validation
131
+ args:
132
+ num_few_shot: 0
133
+ metrics:
134
+ - type: mc2
135
+ value: 0.0
136
+ source:
137
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
138
+ name: Open LLM Leaderboard
139
+ - task:
140
+ type: text-generation
141
+ name: Text Generation
142
+ dataset:
143
+ name: GSM8k (5-shot)
144
+ type: gsm8k
145
+ config: main
146
+ split: test
147
+ args:
148
+ num_few_shot: 5
149
+ metrics:
150
+ - type: acc
151
+ value: 0.0
152
+ name: accuracy
153
+ source:
154
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Felladrin/Pythia-31M-Chat-v1
155
+ name: Open LLM Leaderboard
156
+ ---
157
+
158
+ <div style="width: auto; margin-left: auto; margin-right: auto">
159
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
160
+ </div>
161
+ <div style="display: flex; justify-content: space-between; width: 100%;">
162
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
163
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
164
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
165
+ </p>
166
+ </div>
167
+ </div>
168
+
169
+ ## Felladrin/Pythia-31M-Chat-v1 - GGUF
170
+
171
+ This repo contains GGUF format model files for [Felladrin/Pythia-31M-Chat-v1](https://huggingface.co/Felladrin/Pythia-31M-Chat-v1).
172
+
173
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4011](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
174
+
175
+ <div style="text-align: left; margin: 20px 0;">
176
+ <a href="https://tensorblock.co/waitlist/client" style="display: inline-block; padding: 10px 20px; background-color: #007bff; color: white; text-decoration: none; border-radius: 5px; font-weight: bold;">
177
+ Run them on the TensorBlock client using your local machine ↗
178
+ </a>
179
+ </div>
180
+
181
+ ## Prompt template
182
+
183
+ ```
184
+ <|im_start|>system
185
+ {system_prompt}<|im_end|>
186
+ <|im_start|>user
187
+ {prompt}<|im_end|>
188
+ <|im_start|>assistant
189
+ ```
190
+
191
+ ## Model file specification
192
+
193
+ | Filename | Quant type | File Size | Description |
194
+ | -------- | ---------- | --------- | ----------- |
195
+ | [Pythia-31M-Chat-v1-Q2_K.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q2_K.gguf) | Q2_K | 0.017 GB | smallest, significant quality loss - not recommended for most purposes |
196
+ | [Pythia-31M-Chat-v1-Q3_K_S.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q3_K_S.gguf) | Q3_K_S | 0.019 GB | very small, high quality loss |
197
+ | [Pythia-31M-Chat-v1-Q3_K_M.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q3_K_M.gguf) | Q3_K_M | 0.019 GB | very small, high quality loss |
198
+ | [Pythia-31M-Chat-v1-Q3_K_L.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q3_K_L.gguf) | Q3_K_L | 0.019 GB | small, substantial quality loss |
199
+ | [Pythia-31M-Chat-v1-Q4_0.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q4_0.gguf) | Q4_0 | 0.021 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
200
+ | [Pythia-31M-Chat-v1-Q4_K_S.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q4_K_S.gguf) | Q4_K_S | 0.021 GB | small, greater quality loss |
201
+ | [Pythia-31M-Chat-v1-Q4_K_M.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q4_K_M.gguf) | Q4_K_M | 0.021 GB | medium, balanced quality - recommended |
202
+ | [Pythia-31M-Chat-v1-Q5_0.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q5_0.gguf) | Q5_0 | 0.023 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
203
+ | [Pythia-31M-Chat-v1-Q5_K_S.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q5_K_S.gguf) | Q5_K_S | 0.023 GB | large, low quality loss - recommended |
204
+ | [Pythia-31M-Chat-v1-Q5_K_M.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q5_K_M.gguf) | Q5_K_M | 0.023 GB | large, very low quality loss - recommended |
205
+ | [Pythia-31M-Chat-v1-Q6_K.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q6_K.gguf) | Q6_K | 0.025 GB | very large, extremely low quality loss |
206
+ | [Pythia-31M-Chat-v1-Q8_0.gguf](https://huggingface.co/tensorblock/Pythia-31M-Chat-v1-GGUF/blob/main/Pythia-31M-Chat-v1-Q8_0.gguf) | Q8_0 | 0.032 GB | very large, extremely low quality loss - not recommended |
207
+
208
+
209
+ ## Download instructions
210
+
211
+ ### Command line
212
+
213
+ First, install the Hugging Face Hub command-line client:
214
+
215
+ ```shell
216
+ pip install -U "huggingface_hub[cli]"
217
+ ```
218
+
219
+ Then, download an individual model file to a local directory:
220
+
221
+ ```shell
222
+ huggingface-cli download tensorblock/Pythia-31M-Chat-v1-GGUF --include "Pythia-31M-Chat-v1-Q2_K.gguf" --local-dir MY_LOCAL_DIR
223
+ ```
224
+
225
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can run:
226
+
227
+ ```shell
228
+ huggingface-cli download tensorblock/Pythia-31M-Chat-v1-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
229
+ ```