eduagarcia commited on
Commit
b4fc70b
1 Parent(s): 4c822de

fix typo and multiple models in README

Browse files
README.md CHANGED
@@ -27,58 +27,141 @@ space_ci: # See https://huggingface.co/spaces/Wauplin/gradio-space-ci
27
  - IS_PUBLIC
28
  - HAS_HIGHER_RATE_LIMIT
29
  models:
30
- - gpt2
31
- - t5-base
32
- - t5-large
33
- - t5-small
34
  - 01-ai/Yi-34B-200K
35
  - 01-ai/Yi-34B-Chat
36
- - 01-ai/Yi-34B
37
  - 01-ai/Yi-6B-200K
38
  - 01-ai/Yi-6B-Chat
39
- - 01-ai/Yi-6B
40
- - 01-ai/Yi-9B-200k
41
  - 01-ai/Yi-9B
 
42
  - 22h/cabrita_7b_pt_850000
43
  - 22h/open-cabrita3b
44
- - abacusai/Smaug-34B-v0.1
45
- - abacusai/Smaug-72B-v0.1
46
- - AetherResearch/Cerebrum-1.0-7b
47
  - AI-Sweden-Models/gpt-sw3-40b
48
- - AI-Sweden-Models/gpt-sw3-6.7b-v2
49
  - AI-Sweden-Models/gpt-sw3-6.7b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  - allenai/OLMo-1B
51
- - allenai/OLMo-7B-Twin-2T
52
  - allenai/OLMo-7B
 
53
  - allenai/tulu-2-dpo-13b
54
  - allenai/tulu-2-dpo-7b
55
  - argilla/CapybaraHermes-2.5-Mistral-7B
56
  - argilla/notus-7b-v1
57
  - argilla/notux-8x7b-v1
58
- - BAAI/Aquila-7B
59
- - BAAI/Aquila2-34B
60
- - BAAI/Aquila2-7B
61
  - baichuan-inc/Baichuan-7B
62
  - baichuan-inc/Baichuan2-13B-Base
63
  - baichuan-inc/Baichuan2-7B-Base
64
  - bardsai/jaskier-7b-dpo-v5.6
65
- - bardsai/jaskier-7b-dpo-v5.6
66
  - berkeley-nest/Starling-LM-7B-alpha
67
  - bigscience/bloom-1b7
68
  - bigscience/bloom-3b
69
  - bigscience/bloom-560m
70
  - bigscience/bloom-7b1
71
- - Bruno/Caramelinho
72
- - Bruno/Caramelo_7B
73
- - cnmoro/Mistral-7B-Portuguese
74
  - cnmoro/Mistral-7B-Portuguese
75
- - CohereForAI/aya-101
76
- - CohereForAI/c4ai-command-r-plus-4bit
77
- - CohereForAI/c4ai-command-r-v01
78
  - croissantllm/CroissantLLMBase
79
- - DAMO-NLP-MT/polylm-1.7b
80
- - DAMO-NLP-MT/polylm-13b
81
- - Deci/DeciLM-7B
82
  - deepseek-ai/deepseek-llm-7b-base
83
  - deepseek-ai/deepseek-moe-16b-base
84
  - deepseek-ai/deepseek-moe-16b-chat
@@ -88,20 +171,6 @@ models:
88
  - dynamofl/dynamo-8B-v0.1
89
  - eduagarcia/gemma-7b-it_no_chat_template
90
  - eduagarcia/gemma-7b-it_singleturn_chat_template
91
- - EleutherAI/gpt-j-6b
92
- - EleutherAI/gpt-neo-1.3B
93
- - EleutherAI/gpt-neo-125m
94
- - EleutherAI/gpt-neo-2.7B
95
- - EleutherAI/gpt-neox-20b
96
- - EleutherAI/pythia-14m
97
- - EleutherAI/pythia-160m-deduped
98
- - EleutherAI/pythia-1b-deduped
99
- - EleutherAI/pythia-1b
100
- - EleutherAI/pythia-2.8b-deduped
101
- - EleutherAI/pythia-410m-deduped
102
- - EleutherAI/pythia-6.9b-deduped
103
- - EleutherAI/pythia-6.9b
104
- - EleutherAI/pythia-70m-deduped
105
  - facebook/opt-1.3b
106
  - facebook/opt-125m
107
  - facebook/opt-13b
@@ -110,37 +179,25 @@ models:
110
  - facebook/opt-350m
111
  - facebook/opt-6.7b
112
  - facebook/opt-66b
113
- - fernandosola/bluearara-7B-instruct
114
- - fernandosola/bluearara-7B
115
  - fernandosola/bluearara-7B
116
- - FuseAI/FuseChat-7B-VaRM
117
- - FuseAI/OpenChat-3.5-7B-Solar
118
  - google/gemma-1.1-2b-it
119
  - google/gemma-1.1-7b-it
120
- - google/gemma-2b-it
121
  - google/gemma-2b
122
- - google/gemma-7b-it
123
- - google/gemma-7b-it
124
  - google/gemma-7b
 
125
  - google/mt5-base
126
- - google/mt5-base
127
- - google/mt5-small
128
  - google/mt5-small
 
129
  - h2oai/h2o-danube-1.8b-base
130
  - h2oai/h2o-danube-1.8b-chat
131
  - h2oai/h2o-danube2-1.8b-base
132
  - h2oai/h2o-danube2-1.8b-chat
133
- - HeyLucasLeao/gpt-neo-small-portuguese
134
- - HuggingFaceH4/zephyr-7b-alpha
135
- - HuggingFaceH4/zephyr-7b-beta
136
- - HuggingFaceH4/zephyr-7b-gemma-v0.1
137
- - HuggingFaceTB/cosmo-1b
138
  - huggyllama/llama-13b
139
  - huggyllama/llama-30b
140
  - huggyllama/llama-65b
141
  - huggyllama/llama-7b
142
- - Intel/neural-chat-7b-v3-1
143
- - Intel/neural-chat-7b-v3-3
144
  - internlm/internlm-20b
145
  - internlm/internlm-7b
146
  - internlm/internlm2-1_8b
@@ -149,18 +206,8 @@ models:
149
  - internlm/internlm2-base-20b
150
  - internlm/internlm2-base-7b
151
  - internlm/internlm2-chat-1_8b
152
- - internlm/internlm2-chat-1_8b
153
  - internlm/internlm2-chat-20b
154
- - internlm/internlm2-chat-20b
155
- - internlm/internlm2-chat-7b
156
  - internlm/internlm2-chat-7b
157
- - J-LAB/BRisa-7B-Instruct-v0.2
158
- - J-LAB/BRisa-7B-Instruct-v0.2
159
- - JJhooww/Mistral-7B-v0.2-Base_ptbr
160
- - JJhooww/Mistral-7B-v0.2-Base_ptbr
161
- - JJhooww/MistralReloadBR_v2_ptbr
162
- - JJhooww/Mistral_Relora_Step2k
163
- - JJhooww/Mistral_Relora_Step2k
164
  - josu/gpt-neo-pt-1.3B
165
  - josu/gpt-neo-pt-br
166
  - lmsys/vicuna-13b-v1.5
@@ -168,21 +215,18 @@ models:
168
  - lrds-code/boana-7b-instruct
169
  - lrds-code/samba-1.1B
170
  - lucianosb/boto-7B
171
- - MagusCorp/legislinho
172
- - maritaca-ai/sabia-7b
173
  - maritaca-ai/sabia-7b
174
  - matsuo-lab/weblab-10b
175
- - MaziyarPanahi/Mistral-7B-Instruct-Aya-101
176
  - meta-llama/Llama-2-13b-chat-hf
177
  - meta-llama/Llama-2-13b-hf
178
  - meta-llama/Llama-2-70b-chat-hf
179
  - meta-llama/Llama-2-70b-hf
180
  - meta-llama/Llama-2-7b-chat-hf
181
  - meta-llama/Llama-2-7b-hf
182
- - meta-llama/Meta-Llama-3-8B-Instruct
183
  - meta-llama/Meta-Llama-3-8B
184
- - microsoft/phi-1_5
185
  - microsoft/phi-1
 
186
  - microsoft/phi-2
187
  - mistral-community/Mistral-7B-v0.2
188
  - mistral-community/Mixtral-8x22B-v0.1-4bit
@@ -192,159 +236,87 @@ models:
192
  - mistralai/Mixtral-8x7B-v0.1
193
  - mlabonne/Monarch-7B
194
  - monilouise/opt125M_portuguese
195
- - mosaicml/mpt-7b-8k
196
  - mosaicml/mpt-7b
197
- - Nexusflow/Starling-LM-7B-beta
198
  - nicholasKluge/Aira-2-portuguese-124M
199
  - nicholasKluge/Aira-2-portuguese-1B7
200
  - nicholasKluge/Aira-2-portuguese-560M
201
  - nicholasKluge/TeenyTinyLlama-160m
202
- - nicholasKluge/TeenyTinyLlama-460m-Chat
203
  - nicholasKluge/TeenyTinyLlama-460m
204
- - nicolasdec/cabra13b
 
205
  - nicolasdec/CabraMistral7b-0.4
206
- - nicolasdec/Cabramistral7b
207
- - nicolasdec/Cabramistral7b
208
- - nicolasdec/CabraQwen14b
209
  - nicolasdec/CabraQwen14b
210
  - nicolasdec/CabraQwen7b
211
- - nicolasdec/Cabra
212
- - NousResearch/Nous-Hermes-13b
213
- - NousResearch/Nous-Hermes-2-Mistral-7B-DPO
214
- - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
215
- - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
216
- - NousResearch/Nous-Hermes-2-SOLAR-10.7B
217
- - NousResearch/Nous-Hermes-2-Yi-34B
218
- - NOVA-vision-language/GlorIA-1.3B
219
- - NucleusAI/nucleus-22B-token-500B
220
  - openai-community/gpt2-large
221
  - openai-community/gpt2-medium
222
  - openai-community/gpt2-xl
223
  - openai-community/openai-gpt
224
  - openchat/openchat-3.5-0106
225
- - OpenLLM-France/Claire-7B-0.1
226
- - OpenLLM-France/Claire-Mistral-7B-0.1
227
  - openlm-research/open_llama_13b
228
  - openlm-research/open_llama_3b
229
  - openlm-research/open_llama_3b_v2
230
  - openlm-research/open_llama_7b
231
  - openlm-research/open_llama_7b_v2
232
- - OrionStarAI/Orion-14B-Base
233
  - paulml/OGNO-7B
234
  - pierreguillou/gpt2-small-portuguese
235
- - PORTULAN/gervasio-7b-portuguese-ptbr-decoder
236
- - PORTULAN/gervasio-7b-portuguese-ptpt-decoder
237
- - projecte-aina/aguila-7b
238
  - projecte-aina/FLOR-1.3B
239
  - projecte-aina/FLOR-6.3B
240
  - projecte-aina/FLOR-760M
 
241
  - pucpr/gpt2-bio-pt
242
- - Qwen/Qwen-14B
243
- - Qwen/Qwen-14B
244
- - Qwen/Qwen-1_8B-Chat
245
- - Qwen/Qwen-1_8B-Chat
246
- - Qwen/Qwen-1_8B
247
- - Qwen/Qwen-1_8B
248
- - Qwen/Qwen-72B-Chat
249
- - Qwen/Qwen-72B
250
- - Qwen/Qwen-7B-Chat
251
- - Qwen/Qwen-7B-Chat
252
- - Qwen/Qwen-7B
253
- - Qwen/Qwen-7B
254
- - Qwen/Qwen1.5-0.5B-Chat
255
- - Qwen/Qwen1.5-0.5B
256
- - Qwen/Qwen1.5-1.8B-Chat
257
- - Qwen/Qwen1.5-1.8B
258
- - Qwen/Qwen1.5-14B-Chat
259
- - Qwen/Qwen1.5-14B
260
- - Qwen/Qwen1.5-32B-Chat
261
- - Qwen/Qwen1.5-32B
262
- - Qwen/Qwen1.5-4B-Chat
263
- - Qwen/Qwen1.5-4B
264
- - Qwen/Qwen1.5-72B-Chat
265
- - Qwen/Qwen1.5-72B
266
- - Qwen/Qwen1.5-7B-Chat
267
- - Qwen/Qwen1.5-7B
268
- - Qwen/Qwen1.5-MoE-A2.7B-Chat
269
- - Qwen/Qwen1.5-MoE-A2.7B
270
  - recogna-nlp/bode-13b-alpaca-pt-br
271
  - recogna-nlp/bode-7b-alpaca-pt-br
272
- - recogna-nlp/GemBode-2b-it
273
  - recogna-nlp/gembode-2b-ultraalpaca
274
  - recogna-nlp/internlmbode-7b
275
  - recogna-nlp/mistral-bode
276
  - recogna-nlp/phi-bode-2-ultraalpaca
277
- - recogna-nlp/Phi-Bode
278
- - rhaymison/gemma-portuguese-2b-it
279
- - rhaymison/gemma-portuguese-luana-2b
280
- - rhaymison/gemma-portuguese-luana-2b
281
  - rhaymison/Llama-portuguese-13b-Luana-v0.2
282
- - rhaymison/Mistral-portuguese-luana-7b-chat
283
- - rhaymison/Mistral-portuguese-luana-7b-Mathematics
284
  - rhaymison/Mistral-portuguese-luana-7b-Mathematics
 
285
  - rhaymison/Mistral-portuguese-luana-7b-mental-health
286
- - rhaymison/Mistral-portuguese-luana-7b-mental-health
287
- - rhaymison/Mistral-portuguese-luana-7b
288
- - rhaymison/Qwen-portuguese-luana-7b
289
  - rhaymison/Qwen-portuguese-luana-7b
290
- - rishiraj/CatPPT-base
 
291
  - rishiraj/CatPPT
 
292
  - semantixai/LloroV2
293
- - Skywork/Skywork-13B-base
294
- - stabilityai/stablelm-2-12b-chat
295
  - stabilityai/stablelm-2-12b
296
- - stabilityai/stablelm-2-1_6b-chat
297
- - stabilityai/stablelm-2-1_6b
298
  - stabilityai/stablelm-2-1_6b
 
299
  - stabilityai/stablelm-2-zephyr-1_6b
300
  - stabilityai/stablelm-3b-4e1t
301
- - stabilityai/stablelm-base-alpha-3b-v2
302
  - stabilityai/stablelm-base-alpha-3b
303
- - stabilityai/stablelm-base-alpha-7b-v2
304
  - stabilityai/stablelm-base-alpha-7b
 
305
  - stabilityai/stablelm-zephyr-3b
306
  - state-spaces/mamba-1.4b-hf
307
  - state-spaces/mamba-130m-hf
308
  - state-spaces/mamba-2.8b-hf
309
  - state-spaces/mamba-370m-hf
310
  - state-spaces/mamba-790m-hf
 
 
 
311
  - teknium/OpenHermes-2-Mistral-7B
312
  - teknium/OpenHermes-2.5-Mistral-7B
313
- - TencentARC/Mistral_Pro_8B_v0.1
314
- - THUDM/agentlm-7b
315
- - THUDM/chatglm2-6b
316
- - THUDM/chatglm3-6b-128k
317
- - THUDM/chatglm3-6b-32k
318
- - THUDM/chatglm3-6b-base
319
- - THUDM/chatglm3-6b
320
- - THUDM/LongAlign-7B-64k
321
  - tiiuae/falcon-40b
322
  - tiiuae/falcon-7b
323
- - TinyLlama/TinyLlama-1.1B-Chat-v1.0
324
- - TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
325
  - togethercomputer/RedPajama-INCITE-7B-Base
326
  - togethercomputer/RedPajama-INCITE-Base-3B-v1
327
- - Unbabel/TowerBase-7B-v0.1
328
  - upstage/SOLAR-10.7B-Instruct-v1.0
329
  - upstage/SOLAR-10.7B-v1.0
330
- - Walmart-the-bag/Misted-v2-7B
331
- - Walmart-the-bag/WordWoven-2x7B
332
  - wandgibaut/periquito-3B
333
- - Weni/WeniGPT-2.2.3-Zephyr-7B-LLM_Base_2.0.3_SFT
334
- - Weni/WeniGPT-2.2.3-Zephyr-7B-merged-LLM_Base_2.0.3_SFT
335
- - Weni/WeniGPT-2.4.1-Zephyr-7B-3-epochs-GPT-QA-1.0.1_DP_DPO
336
- - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
337
- - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
338
- - Weni/WeniGPT-Agents-Zephyr-1.0.17-KTO
339
- - Weni/WeniGPT-Mistral-7B-instructBase-4bit
340
- - Weni/WeniGPT-Mistral-7B-instructBase
341
- - Weni/ZeroShot-3.3.34-Mistral-7b-Multilanguage-3.3.0-merged
342
- - Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
343
- - Weni/ZeroShot-Multilanguage-Zephyr-7B
344
- - Weni/ZeroShot-Multilanguage-Zephyr-7B
345
  - xverse/XVERSE-13B
346
- - xverse/XVERSE-65B-2
347
  - xverse/XVERSE-65B
 
348
  - xverse/XVERSE-7B
349
  ---
350
 
 
27
  - IS_PUBLIC
28
  - HAS_HIGHER_RATE_LIMIT
29
  models:
30
+ - 01-ai/Yi-34B
 
 
 
31
  - 01-ai/Yi-34B-200K
32
  - 01-ai/Yi-34B-Chat
33
+ - 01-ai/Yi-6B
34
  - 01-ai/Yi-6B-200K
35
  - 01-ai/Yi-6B-Chat
 
 
36
  - 01-ai/Yi-9B
37
+ - 01-ai/Yi-9B-200k
38
  - 22h/cabrita_7b_pt_850000
39
  - 22h/open-cabrita3b
 
 
 
40
  - AI-Sweden-Models/gpt-sw3-40b
 
41
  - AI-Sweden-Models/gpt-sw3-6.7b
42
+ - AI-Sweden-Models/gpt-sw3-6.7b-v2
43
+ - AetherResearch/Cerebrum-1.0-7b
44
+ - BAAI/Aquila-7B
45
+ - BAAI/Aquila2-34B
46
+ - BAAI/Aquila2-7B
47
+ - Bruno/Caramelinho
48
+ - Bruno/Caramelo_7B
49
+ - CohereForAI/aya-101
50
+ - CohereForAI/c4ai-command-r-plus-4bit
51
+ - CohereForAI/c4ai-command-r-v01
52
+ - DAMO-NLP-MT/polylm-1.7b
53
+ - DAMO-NLP-MT/polylm-13b
54
+ - Deci/DeciLM-7B
55
+ - EleutherAI/gpt-j-6b
56
+ - EleutherAI/gpt-neo-1.3B
57
+ - EleutherAI/gpt-neo-125m
58
+ - EleutherAI/gpt-neo-2.7B
59
+ - EleutherAI/gpt-neox-20b
60
+ - EleutherAI/pythia-14m
61
+ - EleutherAI/pythia-160m-deduped
62
+ - EleutherAI/pythia-1b
63
+ - EleutherAI/pythia-1b-deduped
64
+ - EleutherAI/pythia-2.8b-deduped
65
+ - EleutherAI/pythia-410m-deduped
66
+ - EleutherAI/pythia-6.9b
67
+ - EleutherAI/pythia-6.9b-deduped
68
+ - EleutherAI/pythia-70m-deduped
69
+ - FuseAI/FuseChat-7B-VaRM
70
+ - FuseAI/OpenChat-3.5-7B-Solar
71
+ - HeyLucasLeao/gpt-neo-small-portuguese
72
+ - HuggingFaceH4/zephyr-7b-alpha
73
+ - HuggingFaceH4/zephyr-7b-beta
74
+ - HuggingFaceH4/zephyr-7b-gemma-v0.1
75
+ - HuggingFaceTB/cosmo-1b
76
+ - Intel/neural-chat-7b-v3-1
77
+ - Intel/neural-chat-7b-v3-3
78
+ - J-LAB/BRisa-7B-Instruct-v0.2
79
+ - JJhooww/Mistral-7B-v0.2-Base_ptbr
80
+ - JJhooww/MistralReloadBR_v2_ptbr
81
+ - JJhooww/Mistral_Relora_Step2k
82
+ - MagusCorp/legislinho
83
+ - MaziyarPanahi/Mistral-7B-Instruct-Aya-101
84
+ - NOVA-vision-language/GlorIA-1.3B
85
+ - Nexusflow/Starling-LM-7B-beta
86
+ - NousResearch/Nous-Hermes-13b
87
+ - NousResearch/Nous-Hermes-2-Mistral-7B-DPO
88
+ - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
89
+ - NousResearch/Nous-Hermes-2-SOLAR-10.7B
90
+ - NousResearch/Nous-Hermes-2-Yi-34B
91
+ - NucleusAI/nucleus-22B-token-500B
92
+ - OpenLLM-France/Claire-7B-0.1
93
+ - OpenLLM-France/Claire-Mistral-7B-0.1
94
+ - OrionStarAI/Orion-14B-Base
95
+ - PORTULAN/gervasio-7b-portuguese-ptbr-decoder
96
+ - PORTULAN/gervasio-7b-portuguese-ptpt-decoder
97
+ - Qwen/Qwen-14B
98
+ - Qwen/Qwen-1_8B
99
+ - Qwen/Qwen-1_8B-Chat
100
+ - Qwen/Qwen-72B
101
+ - Qwen/Qwen-72B-Chat
102
+ - Qwen/Qwen-7B
103
+ - Qwen/Qwen-7B-Chat
104
+ - Qwen/Qwen1.5-0.5B
105
+ - Qwen/Qwen1.5-0.5B-Chat
106
+ - Qwen/Qwen1.5-1.8B
107
+ - Qwen/Qwen1.5-1.8B-Chat
108
+ - Qwen/Qwen1.5-14B
109
+ - Qwen/Qwen1.5-14B-Chat
110
+ - Qwen/Qwen1.5-32B
111
+ - Qwen/Qwen1.5-32B-Chat
112
+ - Qwen/Qwen1.5-4B
113
+ - Qwen/Qwen1.5-4B-Chat
114
+ - Qwen/Qwen1.5-72B
115
+ - Qwen/Qwen1.5-72B-Chat
116
+ - Qwen/Qwen1.5-7B
117
+ - Qwen/Qwen1.5-7B-Chat
118
+ - Qwen/Qwen1.5-MoE-A2.7B
119
+ - Qwen/Qwen1.5-MoE-A2.7B-Chat
120
+ - Skywork/Skywork-13B-base
121
+ - THUDM/LongAlign-7B-64k
122
+ - THUDM/agentlm-7b
123
+ - THUDM/chatglm2-6b
124
+ - THUDM/chatglm3-6b
125
+ - THUDM/chatglm3-6b-128k
126
+ - THUDM/chatglm3-6b-32k
127
+ - THUDM/chatglm3-6b-base
128
+ - TencentARC/Mistral_Pro_8B_v0.1
129
+ - TinyLlama/TinyLlama-1.1B-Chat-v1.0
130
+ - TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
131
+ - Unbabel/TowerBase-7B-v0.1
132
+ - Walmart-the-bag/Misted-v2-7B
133
+ - Walmart-the-bag/WordWoven-2x7B
134
+ - Weni/WeniGPT-2.2.3-Zephyr-7B-LLM_Base_2.0.3_SFT
135
+ - Weni/WeniGPT-2.2.3-Zephyr-7B-merged-LLM_Base_2.0.3_SFT
136
+ - Weni/WeniGPT-2.4.1-Zephyr-7B-3-epochs-GPT-QA-1.0.1_DP_DPO
137
+ - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
138
+ - Weni/WeniGPT-Agents-Zephyr-1.0.17-KTO
139
+ - Weni/WeniGPT-Mistral-7B-instructBase
140
+ - Weni/WeniGPT-Mistral-7B-instructBase-4bit
141
+ - Weni/ZeroShot-3.3.34-Mistral-7b-Multilanguage-3.3.0-merged
142
+ - Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
143
+ - Weni/ZeroShot-Multilanguage-Zephyr-7B
144
+ - abacusai/Smaug-34B-v0.1
145
+ - abacusai/Smaug-72B-v0.1
146
  - allenai/OLMo-1B
 
147
  - allenai/OLMo-7B
148
+ - allenai/OLMo-7B-Twin-2T
149
  - allenai/tulu-2-dpo-13b
150
  - allenai/tulu-2-dpo-7b
151
  - argilla/CapybaraHermes-2.5-Mistral-7B
152
  - argilla/notus-7b-v1
153
  - argilla/notux-8x7b-v1
 
 
 
154
  - baichuan-inc/Baichuan-7B
155
  - baichuan-inc/Baichuan2-13B-Base
156
  - baichuan-inc/Baichuan2-7B-Base
157
  - bardsai/jaskier-7b-dpo-v5.6
 
158
  - berkeley-nest/Starling-LM-7B-alpha
159
  - bigscience/bloom-1b7
160
  - bigscience/bloom-3b
161
  - bigscience/bloom-560m
162
  - bigscience/bloom-7b1
 
 
 
163
  - cnmoro/Mistral-7B-Portuguese
 
 
 
164
  - croissantllm/CroissantLLMBase
 
 
 
165
  - deepseek-ai/deepseek-llm-7b-base
166
  - deepseek-ai/deepseek-moe-16b-base
167
  - deepseek-ai/deepseek-moe-16b-chat
 
171
  - dynamofl/dynamo-8B-v0.1
172
  - eduagarcia/gemma-7b-it_no_chat_template
173
  - eduagarcia/gemma-7b-it_singleturn_chat_template
 
 
 
 
 
 
 
 
 
 
 
 
 
 
174
  - facebook/opt-1.3b
175
  - facebook/opt-125m
176
  - facebook/opt-13b
 
179
  - facebook/opt-350m
180
  - facebook/opt-6.7b
181
  - facebook/opt-66b
 
 
182
  - fernandosola/bluearara-7B
183
+ - fernandosola/bluearara-7B-instruct
 
184
  - google/gemma-1.1-2b-it
185
  - google/gemma-1.1-7b-it
 
186
  - google/gemma-2b
187
+ - google/gemma-2b-it
 
188
  - google/gemma-7b
189
+ - google/gemma-7b-it
190
  - google/mt5-base
 
 
191
  - google/mt5-small
192
+ - gpt2
193
  - h2oai/h2o-danube-1.8b-base
194
  - h2oai/h2o-danube-1.8b-chat
195
  - h2oai/h2o-danube2-1.8b-base
196
  - h2oai/h2o-danube2-1.8b-chat
 
 
 
 
 
197
  - huggyllama/llama-13b
198
  - huggyllama/llama-30b
199
  - huggyllama/llama-65b
200
  - huggyllama/llama-7b
 
 
201
  - internlm/internlm-20b
202
  - internlm/internlm-7b
203
  - internlm/internlm2-1_8b
 
206
  - internlm/internlm2-base-20b
207
  - internlm/internlm2-base-7b
208
  - internlm/internlm2-chat-1_8b
 
209
  - internlm/internlm2-chat-20b
 
 
210
  - internlm/internlm2-chat-7b
 
 
 
 
 
 
 
211
  - josu/gpt-neo-pt-1.3B
212
  - josu/gpt-neo-pt-br
213
  - lmsys/vicuna-13b-v1.5
 
215
  - lrds-code/boana-7b-instruct
216
  - lrds-code/samba-1.1B
217
  - lucianosb/boto-7B
 
 
218
  - maritaca-ai/sabia-7b
219
  - matsuo-lab/weblab-10b
 
220
  - meta-llama/Llama-2-13b-chat-hf
221
  - meta-llama/Llama-2-13b-hf
222
  - meta-llama/Llama-2-70b-chat-hf
223
  - meta-llama/Llama-2-70b-hf
224
  - meta-llama/Llama-2-7b-chat-hf
225
  - meta-llama/Llama-2-7b-hf
 
226
  - meta-llama/Meta-Llama-3-8B
227
+ - meta-llama/Meta-Llama-3-8B-Instruct
228
  - microsoft/phi-1
229
+ - microsoft/phi-1_5
230
  - microsoft/phi-2
231
  - mistral-community/Mistral-7B-v0.2
232
  - mistral-community/Mixtral-8x22B-v0.1-4bit
 
236
  - mistralai/Mixtral-8x7B-v0.1
237
  - mlabonne/Monarch-7B
238
  - monilouise/opt125M_portuguese
 
239
  - mosaicml/mpt-7b
240
+ - mosaicml/mpt-7b-8k
241
  - nicholasKluge/Aira-2-portuguese-124M
242
  - nicholasKluge/Aira-2-portuguese-1B7
243
  - nicholasKluge/Aira-2-portuguese-560M
244
  - nicholasKluge/TeenyTinyLlama-160m
 
245
  - nicholasKluge/TeenyTinyLlama-460m
246
+ - nicholasKluge/TeenyTinyLlama-460m-Chat
247
+ - nicolasdec/Cabra
248
  - nicolasdec/CabraMistral7b-0.4
 
 
 
249
  - nicolasdec/CabraQwen14b
250
  - nicolasdec/CabraQwen7b
251
+ - nicolasdec/Cabramistral7b
252
+ - nicolasdec/cabra13b
 
 
 
 
 
 
 
253
  - openai-community/gpt2-large
254
  - openai-community/gpt2-medium
255
  - openai-community/gpt2-xl
256
  - openai-community/openai-gpt
257
  - openchat/openchat-3.5-0106
 
 
258
  - openlm-research/open_llama_13b
259
  - openlm-research/open_llama_3b
260
  - openlm-research/open_llama_3b_v2
261
  - openlm-research/open_llama_7b
262
  - openlm-research/open_llama_7b_v2
 
263
  - paulml/OGNO-7B
264
  - pierreguillou/gpt2-small-portuguese
 
 
 
265
  - projecte-aina/FLOR-1.3B
266
  - projecte-aina/FLOR-6.3B
267
  - projecte-aina/FLOR-760M
268
+ - projecte-aina/aguila-7b
269
  - pucpr/gpt2-bio-pt
270
+ - recogna-nlp/GemBode-2b-it
271
+ - recogna-nlp/Phi-Bode
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
272
  - recogna-nlp/bode-13b-alpaca-pt-br
273
  - recogna-nlp/bode-7b-alpaca-pt-br
 
274
  - recogna-nlp/gembode-2b-ultraalpaca
275
  - recogna-nlp/internlmbode-7b
276
  - recogna-nlp/mistral-bode
277
  - recogna-nlp/phi-bode-2-ultraalpaca
 
 
 
 
278
  - rhaymison/Llama-portuguese-13b-Luana-v0.2
279
+ - rhaymison/Mistral-portuguese-luana-7b
 
280
  - rhaymison/Mistral-portuguese-luana-7b-Mathematics
281
+ - rhaymison/Mistral-portuguese-luana-7b-chat
282
  - rhaymison/Mistral-portuguese-luana-7b-mental-health
 
 
 
283
  - rhaymison/Qwen-portuguese-luana-7b
284
+ - rhaymison/gemma-portuguese-2b-it
285
+ - rhaymison/gemma-portuguese-luana-2b
286
  - rishiraj/CatPPT
287
+ - rishiraj/CatPPT-base
288
  - semantixai/LloroV2
 
 
289
  - stabilityai/stablelm-2-12b
290
+ - stabilityai/stablelm-2-12b-chat
 
291
  - stabilityai/stablelm-2-1_6b
292
+ - stabilityai/stablelm-2-1_6b-chat
293
  - stabilityai/stablelm-2-zephyr-1_6b
294
  - stabilityai/stablelm-3b-4e1t
 
295
  - stabilityai/stablelm-base-alpha-3b
296
+ - stabilityai/stablelm-base-alpha-3b-v2
297
  - stabilityai/stablelm-base-alpha-7b
298
+ - stabilityai/stablelm-base-alpha-7b-v2
299
  - stabilityai/stablelm-zephyr-3b
300
  - state-spaces/mamba-1.4b-hf
301
  - state-spaces/mamba-130m-hf
302
  - state-spaces/mamba-2.8b-hf
303
  - state-spaces/mamba-370m-hf
304
  - state-spaces/mamba-790m-hf
305
+ - t5-base
306
+ - t5-large
307
+ - t5-small
308
  - teknium/OpenHermes-2-Mistral-7B
309
  - teknium/OpenHermes-2.5-Mistral-7B
 
 
 
 
 
 
 
 
310
  - tiiuae/falcon-40b
311
  - tiiuae/falcon-7b
 
 
312
  - togethercomputer/RedPajama-INCITE-7B-Base
313
  - togethercomputer/RedPajama-INCITE-Base-3B-v1
 
314
  - upstage/SOLAR-10.7B-Instruct-v1.0
315
  - upstage/SOLAR-10.7B-v1.0
 
 
316
  - wandgibaut/periquito-3B
 
 
 
 
 
 
 
 
 
 
 
 
317
  - xverse/XVERSE-13B
 
318
  - xverse/XVERSE-65B
319
+ - xverse/XVERSE-65B-2
320
  - xverse/XVERSE-7B
321
  ---
322
 
model_list.txt CHANGED
@@ -1,55 +1,138 @@
1
- - gpt2
2
- - t5-base
3
- - t5-large
4
- - t5-small
5
  - 01-ai/Yi-34B-200K
6
  - 01-ai/Yi-34B-Chat
7
- - 01-ai/Yi-34B
8
  - 01-ai/Yi-6B-200K
9
  - 01-ai/Yi-6B-Chat
10
- - 01-ai/Yi-6B
11
- - 01-ai/Yi-9B-200k
12
  - 01-ai/Yi-9B
 
13
  - 22h/cabrita_7b_pt_850000
14
  - 22h/open-cabrita3b
15
- - abacusai/Smaug-34B-v0.1
16
- - abacusai/Smaug-72B-v0.1
17
- - AetherResearch/Cerebrum-1.0-7b
18
  - AI-Sweden-Models/gpt-sw3-40b
19
- - AI-Sweden-Models/gpt-sw3-6.7b-v2
20
  - AI-Sweden-Models/gpt-sw3-6.7b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  - allenai/OLMo-1B
22
- - allenai/OLMo-7B-Twin-2T
23
  - allenai/OLMo-7B
 
24
  - allenai/tulu-2-dpo-13b
25
  - allenai/tulu-2-dpo-7b
26
  - argilla/CapybaraHermes-2.5-Mistral-7B
27
  - argilla/notus-7b-v1
28
  - argilla/notux-8x7b-v1
29
- - BAAI/Aquila-7B
30
- - BAAI/Aquila2-34B
31
- - BAAI/Aquila2-7B
32
  - baichuan-inc/Baichuan-7B
33
  - baichuan-inc/Baichuan2-13B-Base
34
  - baichuan-inc/Baichuan2-7B-Base
35
  - bardsai/jaskier-7b-dpo-v5.6
36
- - bardsai/jaskier-7b-dpo-v5.6
37
  - berkeley-nest/Starling-LM-7B-alpha
38
  - bigscience/bloom-1b7
39
  - bigscience/bloom-3b
40
  - bigscience/bloom-560m
41
  - bigscience/bloom-7b1
42
- - Bruno/Caramelinho
43
- - Bruno/Caramelo_7B
44
- - cnmoro/Mistral-7B-Portuguese
45
  - cnmoro/Mistral-7B-Portuguese
46
- - CohereForAI/aya-101
47
- - CohereForAI/c4ai-command-r-plus-4bit
48
- - CohereForAI/c4ai-command-r-v01
49
  - croissantllm/CroissantLLMBase
50
- - DAMO-NLP-MT/polylm-1.7b
51
- - DAMO-NLP-MT/polylm-13b
52
- - Deci/DeciLM-7B
53
  - deepseek-ai/deepseek-llm-7b-base
54
  - deepseek-ai/deepseek-moe-16b-base
55
  - deepseek-ai/deepseek-moe-16b-chat
@@ -59,20 +142,6 @@
59
  - dynamofl/dynamo-8B-v0.1
60
  - eduagarcia/gemma-7b-it_no_chat_template
61
  - eduagarcia/gemma-7b-it_singleturn_chat_template
62
- - EleutherAI/gpt-j-6b
63
- - EleutherAI/gpt-neo-1.3B
64
- - EleutherAI/gpt-neo-125m
65
- - EleutherAI/gpt-neo-2.7B
66
- - EleutherAI/gpt-neox-20b
67
- - EleutherAI/pythia-14m
68
- - EleutherAI/pythia-160m-deduped
69
- - EleutherAI/pythia-1b-deduped
70
- - EleutherAI/pythia-1b
71
- - EleutherAI/pythia-2.8b-deduped
72
- - EleutherAI/pythia-410m-deduped
73
- - EleutherAI/pythia-6.9b-deduped
74
- - EleutherAI/pythia-6.9b
75
- - EleutherAI/pythia-70m-deduped
76
  - facebook/opt-1.3b
77
  - facebook/opt-125m
78
  - facebook/opt-13b
@@ -81,37 +150,25 @@
81
  - facebook/opt-350m
82
  - facebook/opt-6.7b
83
  - facebook/opt-66b
84
- - fernandosola/bluearara-7B-instruct
85
- - fernandosola/bluearara-7B
86
  - fernandosola/bluearara-7B
87
- - FuseAI/FuseChat-7B-VaRM
88
- - FuseAI/OpenChat-3.5-7B-Solar
89
  - google/gemma-1.1-2b-it
90
  - google/gemma-1.1-7b-it
91
- - google/gemma-2b-it
92
  - google/gemma-2b
93
- - google/gemma-7b-it
94
- - google/gemma-7b-it
95
  - google/gemma-7b
 
96
  - google/mt5-base
97
- - google/mt5-base
98
- - google/mt5-small
99
  - google/mt5-small
 
100
  - h2oai/h2o-danube-1.8b-base
101
  - h2oai/h2o-danube-1.8b-chat
102
  - h2oai/h2o-danube2-1.8b-base
103
  - h2oai/h2o-danube2-1.8b-chat
104
- - HeyLucasLeao/gpt-neo-small-portuguese
105
- - HuggingFaceH4/zephyr-7b-alpha
106
- - HuggingFaceH4/zephyr-7b-beta
107
- - HuggingFaceH4/zephyr-7b-gemma-v0.1
108
- - HuggingFaceTB/cosmo-1b
109
  - huggyllama/llama-13b
110
  - huggyllama/llama-30b
111
  - huggyllama/llama-65b
112
  - huggyllama/llama-7b
113
- - Intel/neural-chat-7b-v3-1
114
- - Intel/neural-chat-7b-v3-3
115
  - internlm/internlm-20b
116
  - internlm/internlm-7b
117
  - internlm/internlm2-1_8b
@@ -120,18 +177,8 @@
120
  - internlm/internlm2-base-20b
121
  - internlm/internlm2-base-7b
122
  - internlm/internlm2-chat-1_8b
123
- - internlm/internlm2-chat-1_8b
124
  - internlm/internlm2-chat-20b
125
- - internlm/internlm2-chat-20b
126
- - internlm/internlm2-chat-7b
127
  - internlm/internlm2-chat-7b
128
- - J-LAB/BRisa-7B-Instruct-v0.2
129
- - J-LAB/BRisa-7B-Instruct-v0.2
130
- - JJhooww/Mistral-7B-v0.2-Base_ptbr
131
- - JJhooww/Mistral-7B-v0.2-Base_ptbr
132
- - JJhooww/MistralReloadBR_v2_ptbr
133
- - JJhooww/Mistral_Relora_Step2k
134
- - JJhooww/Mistral_Relora_Step2k
135
  - josu/gpt-neo-pt-1.3B
136
  - josu/gpt-neo-pt-br
137
  - lmsys/vicuna-13b-v1.5
@@ -139,21 +186,18 @@
139
  - lrds-code/boana-7b-instruct
140
  - lrds-code/samba-1.1B
141
  - lucianosb/boto-7B
142
- - MagusCorp/legislinho
143
- - maritaca-ai/sabia-7b
144
  - maritaca-ai/sabia-7b
145
  - matsuo-lab/weblab-10b
146
- - MaziyarPanahi/Mistral-7B-Instruct-Aya-101
147
  - meta-llama/Llama-2-13b-chat-hf
148
  - meta-llama/Llama-2-13b-hf
149
  - meta-llama/Llama-2-70b-chat-hf
150
  - meta-llama/Llama-2-70b-hf
151
  - meta-llama/Llama-2-7b-chat-hf
152
  - meta-llama/Llama-2-7b-hf
153
- - meta-llama/Meta-Llama-3-8B-Instruct
154
  - meta-llama/Meta-Llama-3-8B
155
- - microsoft/phi-1_5
156
  - microsoft/phi-1
 
157
  - microsoft/phi-2
158
  - mistral-community/Mistral-7B-v0.2
159
  - mistral-community/Mixtral-8x22B-v0.1-4bit
@@ -163,157 +207,85 @@
163
  - mistralai/Mixtral-8x7B-v0.1
164
  - mlabonne/Monarch-7B
165
  - monilouise/opt125M_portuguese
166
- - mosaicml/mpt-7b-8k
167
  - mosaicml/mpt-7b
168
- - Nexusflow/Starling-LM-7B-beta
169
  - nicholasKluge/Aira-2-portuguese-124M
170
  - nicholasKluge/Aira-2-portuguese-1B7
171
  - nicholasKluge/Aira-2-portuguese-560M
172
  - nicholasKluge/TeenyTinyLlama-160m
173
- - nicholasKluge/TeenyTinyLlama-460m-Chat
174
  - nicholasKluge/TeenyTinyLlama-460m
175
- - nicolasdec/cabra13b
 
176
  - nicolasdec/CabraMistral7b-0.4
177
- - nicolasdec/Cabramistral7b
178
- - nicolasdec/Cabramistral7b
179
- - nicolasdec/CabraQwen14b
180
  - nicolasdec/CabraQwen14b
181
  - nicolasdec/CabraQwen7b
182
- - nicolasdec/Cabra
183
- - NousResearch/Nous-Hermes-13b
184
- - NousResearch/Nous-Hermes-2-Mistral-7B-DPO
185
- - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
186
- - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
187
- - NousResearch/Nous-Hermes-2-SOLAR-10.7B
188
- - NousResearch/Nous-Hermes-2-Yi-34B
189
- - NOVA-vision-language/GlorIA-1.3B
190
- - NucleusAI/nucleus-22B-token-500B
191
  - openai-community/gpt2-large
192
  - openai-community/gpt2-medium
193
  - openai-community/gpt2-xl
194
  - openai-community/openai-gpt
195
  - openchat/openchat-3.5-0106
196
- - OpenLLM-France/Claire-7B-0.1
197
- - OpenLLM-France/Claire-Mistral-7B-0.1
198
  - openlm-research/open_llama_13b
199
  - openlm-research/open_llama_3b
200
  - openlm-research/open_llama_3b_v2
201
  - openlm-research/open_llama_7b
202
  - openlm-research/open_llama_7b_v2
203
- - OrionStarAI/Orion-14B-Base
204
  - paulml/OGNO-7B
205
  - pierreguillou/gpt2-small-portuguese
206
- - PORTULAN/gervasio-7b-portuguese-ptbr-decoder
207
- - PORTULAN/gervasio-7b-portuguese-ptpt-decoder
208
- - projecte-aina/aguila-7b
209
  - projecte-aina/FLOR-1.3B
210
  - projecte-aina/FLOR-6.3B
211
  - projecte-aina/FLOR-760M
 
212
  - pucpr/gpt2-bio-pt
213
- - Qwen/Qwen-14B
214
- - Qwen/Qwen-14B
215
- - Qwen/Qwen-1_8B-Chat
216
- - Qwen/Qwen-1_8B-Chat
217
- - Qwen/Qwen-1_8B
218
- - Qwen/Qwen-1_8B
219
- - Qwen/Qwen-72B-Chat
220
- - Qwen/Qwen-72B
221
- - Qwen/Qwen-7B-Chat
222
- - Qwen/Qwen-7B-Chat
223
- - Qwen/Qwen-7B
224
- - Qwen/Qwen-7B
225
- - Qwen/Qwen1.5-0.5B-Chat
226
- - Qwen/Qwen1.5-0.5B
227
- - Qwen/Qwen1.5-1.8B-Chat
228
- - Qwen/Qwen1.5-1.8B
229
- - Qwen/Qwen1.5-14B-Chat
230
- - Qwen/Qwen1.5-14B
231
- - Qwen/Qwen1.5-32B-Chat
232
- - Qwen/Qwen1.5-32B
233
- - Qwen/Qwen1.5-4B-Chat
234
- - Qwen/Qwen1.5-4B
235
- - Qwen/Qwen1.5-72B-Chat
236
- - Qwen/Qwen1.5-72B
237
- - Qwen/Qwen1.5-7B-Chat
238
- - Qwen/Qwen1.5-7B
239
- - Qwen/Qwen1.5-MoE-A2.7B-Chat
240
- - Qwen/Qwen1.5-MoE-A2.7B
241
  - recogna-nlp/bode-13b-alpaca-pt-br
242
  - recogna-nlp/bode-7b-alpaca-pt-br
243
- - recogna-nlp/GemBode-2b-it
244
  - recogna-nlp/gembode-2b-ultraalpaca
245
  - recogna-nlp/internlmbode-7b
246
  - recogna-nlp/mistral-bode
247
  - recogna-nlp/phi-bode-2-ultraalpaca
248
- - recogna-nlp/Phi-Bode
249
- - rhaymison/gemma-portuguese-2b-it
250
- - rhaymison/gemma-portuguese-luana-2b
251
- - rhaymison/gemma-portuguese-luana-2b
252
  - rhaymison/Llama-portuguese-13b-Luana-v0.2
253
- - rhaymison/Mistral-portuguese-luana-7b-chat
254
- - rhaymison/Mistral-portuguese-luana-7b-Mathematics
255
  - rhaymison/Mistral-portuguese-luana-7b-Mathematics
 
256
  - rhaymison/Mistral-portuguese-luana-7b-mental-health
257
- - rhaymison/Mistral-portuguese-luana-7b-mental-health
258
- - rhaymison/Mistral-portuguese-luana-7b
259
- - rhaymison/Qwen-portuguese-luana-7b
260
  - rhaymison/Qwen-portuguese-luana-7b
261
- - rishiraj/CatPPT-base
 
262
  - rishiraj/CatPPT
 
263
  - semantixai/LloroV2
264
- - Skywork/Skywork-13B-base
265
- - stabilityai/stablelm-2-12b-chat
266
  - stabilityai/stablelm-2-12b
267
- - stabilityai/stablelm-2-1_6b-chat
268
- - stabilityai/stablelm-2-1_6b
269
  - stabilityai/stablelm-2-1_6b
 
270
  - stabilityai/stablelm-2-zephyr-1_6b
271
  - stabilityai/stablelm-3b-4e1t
272
- - stabilityai/stablelm-base-alpha-3b-v2
273
  - stabilityai/stablelm-base-alpha-3b
274
- - stabilityai/stablelm-base-alpha-7b-v2
275
  - stabilityai/stablelm-base-alpha-7b
 
276
  - stabilityai/stablelm-zephyr-3b
277
  - state-spaces/mamba-1.4b-hf
278
  - state-spaces/mamba-130m-hf
279
  - state-spaces/mamba-2.8b-hf
280
  - state-spaces/mamba-370m-hf
281
  - state-spaces/mamba-790m-hf
 
 
 
282
  - teknium/OpenHermes-2-Mistral-7B
283
  - teknium/OpenHermes-2.5-Mistral-7B
284
- - TencentARC/Mistral_Pro_8B_v0.1
285
- - THUDM/agentlm-7b
286
- - THUDM/chatglm2-6b
287
- - THUDM/chatglm3-6b-128k
288
- - THUDM/chatglm3-6b-32k
289
- - THUDM/chatglm3-6b-base
290
- - THUDM/chatglm3-6b
291
- - THUDM/LongAlign-7B-64k
292
  - tiiuae/falcon-40b
293
  - tiiuae/falcon-7b
294
- - TinyLlama/TinyLlama-1.1B-Chat-v1.0
295
- - TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
296
  - togethercomputer/RedPajama-INCITE-7B-Base
297
  - togethercomputer/RedPajama-INCITE-Base-3B-v1
298
- - Unbabel/TowerBase-7B-v0.1
299
  - upstage/SOLAR-10.7B-Instruct-v1.0
300
  - upstage/SOLAR-10.7B-v1.0
301
- - Walmart-the-bag/Misted-v2-7B
302
- - Walmart-the-bag/WordWoven-2x7B
303
  - wandgibaut/periquito-3B
304
- - Weni/WeniGPT-2.2.3-Zephyr-7B-LLM_Base_2.0.3_SFT
305
- - Weni/WeniGPT-2.2.3-Zephyr-7B-merged-LLM_Base_2.0.3_SFT
306
- - Weni/WeniGPT-2.4.1-Zephyr-7B-3-epochs-GPT-QA-1.0.1_DP_DPO
307
- - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
308
- - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
309
- - Weni/WeniGPT-Agents-Zephyr-1.0.17-KTO
310
- - Weni/WeniGPT-Mistral-7B-instructBase-4bit
311
- - Weni/WeniGPT-Mistral-7B-instructBase
312
- - Weni/ZeroShot-3.3.34-Mistral-7b-Multilanguage-3.3.0-merged
313
- - Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
314
- - Weni/ZeroShot-Multilanguage-Zephyr-7B
315
- - Weni/ZeroShot-Multilanguage-Zephyr-7B
316
  - xverse/XVERSE-13B
317
- - xverse/XVERSE-65B-2
318
  - xverse/XVERSE-65B
 
319
  - xverse/XVERSE-7B
 
1
+ - 01-ai/Yi-34B
 
 
 
2
  - 01-ai/Yi-34B-200K
3
  - 01-ai/Yi-34B-Chat
4
+ - 01-ai/Yi-6B
5
  - 01-ai/Yi-6B-200K
6
  - 01-ai/Yi-6B-Chat
 
 
7
  - 01-ai/Yi-9B
8
+ - 01-ai/Yi-9B-200k
9
  - 22h/cabrita_7b_pt_850000
10
  - 22h/open-cabrita3b
 
 
 
11
  - AI-Sweden-Models/gpt-sw3-40b
 
12
  - AI-Sweden-Models/gpt-sw3-6.7b
13
+ - AI-Sweden-Models/gpt-sw3-6.7b-v2
14
+ - AetherResearch/Cerebrum-1.0-7b
15
+ - BAAI/Aquila-7B
16
+ - BAAI/Aquila2-34B
17
+ - BAAI/Aquila2-7B
18
+ - Bruno/Caramelinho
19
+ - Bruno/Caramelo_7B
20
+ - CohereForAI/aya-101
21
+ - CohereForAI/c4ai-command-r-plus-4bit
22
+ - CohereForAI/c4ai-command-r-v01
23
+ - DAMO-NLP-MT/polylm-1.7b
24
+ - DAMO-NLP-MT/polylm-13b
25
+ - Deci/DeciLM-7B
26
+ - EleutherAI/gpt-j-6b
27
+ - EleutherAI/gpt-neo-1.3B
28
+ - EleutherAI/gpt-neo-125m
29
+ - EleutherAI/gpt-neo-2.7B
30
+ - EleutherAI/gpt-neox-20b
31
+ - EleutherAI/pythia-14m
32
+ - EleutherAI/pythia-160m-deduped
33
+ - EleutherAI/pythia-1b
34
+ - EleutherAI/pythia-1b-deduped
35
+ - EleutherAI/pythia-2.8b-deduped
36
+ - EleutherAI/pythia-410m-deduped
37
+ - EleutherAI/pythia-6.9b
38
+ - EleutherAI/pythia-6.9b-deduped
39
+ - EleutherAI/pythia-70m-deduped
40
+ - FuseAI/FuseChat-7B-VaRM
41
+ - FuseAI/OpenChat-3.5-7B-Solar
42
+ - HeyLucasLeao/gpt-neo-small-portuguese
43
+ - HuggingFaceH4/zephyr-7b-alpha
44
+ - HuggingFaceH4/zephyr-7b-beta
45
+ - HuggingFaceH4/zephyr-7b-gemma-v0.1
46
+ - HuggingFaceTB/cosmo-1b
47
+ - Intel/neural-chat-7b-v3-1
48
+ - Intel/neural-chat-7b-v3-3
49
+ - J-LAB/BRisa-7B-Instruct-v0.2
50
+ - JJhooww/Mistral-7B-v0.2-Base_ptbr
51
+ - JJhooww/MistralReloadBR_v2_ptbr
52
+ - JJhooww/Mistral_Relora_Step2k
53
+ - MagusCorp/legislinho
54
+ - MaziyarPanahi/Mistral-7B-Instruct-Aya-101
55
+ - NOVA-vision-language/GlorIA-1.3B
56
+ - Nexusflow/Starling-LM-7B-beta
57
+ - NousResearch/Nous-Hermes-13b
58
+ - NousResearch/Nous-Hermes-2-Mistral-7B-DPO
59
+ - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
60
+ - NousResearch/Nous-Hermes-2-SOLAR-10.7B
61
+ - NousResearch/Nous-Hermes-2-Yi-34B
62
+ - NucleusAI/nucleus-22B-token-500B
63
+ - OpenLLM-France/Claire-7B-0.1
64
+ - OpenLLM-France/Claire-Mistral-7B-0.1
65
+ - OrionStarAI/Orion-14B-Base
66
+ - PORTULAN/gervasio-7b-portuguese-ptbr-decoder
67
+ - PORTULAN/gervasio-7b-portuguese-ptpt-decoder
68
+ - Qwen/Qwen-14B
69
+ - Qwen/Qwen-1_8B
70
+ - Qwen/Qwen-1_8B-Chat
71
+ - Qwen/Qwen-72B
72
+ - Qwen/Qwen-72B-Chat
73
+ - Qwen/Qwen-7B
74
+ - Qwen/Qwen-7B-Chat
75
+ - Qwen/Qwen1.5-0.5B
76
+ - Qwen/Qwen1.5-0.5B-Chat
77
+ - Qwen/Qwen1.5-1.8B
78
+ - Qwen/Qwen1.5-1.8B-Chat
79
+ - Qwen/Qwen1.5-14B
80
+ - Qwen/Qwen1.5-14B-Chat
81
+ - Qwen/Qwen1.5-32B
82
+ - Qwen/Qwen1.5-32B-Chat
83
+ - Qwen/Qwen1.5-4B
84
+ - Qwen/Qwen1.5-4B-Chat
85
+ - Qwen/Qwen1.5-72B
86
+ - Qwen/Qwen1.5-72B-Chat
87
+ - Qwen/Qwen1.5-7B
88
+ - Qwen/Qwen1.5-7B-Chat
89
+ - Qwen/Qwen1.5-MoE-A2.7B
90
+ - Qwen/Qwen1.5-MoE-A2.7B-Chat
91
+ - Skywork/Skywork-13B-base
92
+ - THUDM/LongAlign-7B-64k
93
+ - THUDM/agentlm-7b
94
+ - THUDM/chatglm2-6b
95
+ - THUDM/chatglm3-6b
96
+ - THUDM/chatglm3-6b-128k
97
+ - THUDM/chatglm3-6b-32k
98
+ - THUDM/chatglm3-6b-base
99
+ - TencentARC/Mistral_Pro_8B_v0.1
100
+ - TinyLlama/TinyLlama-1.1B-Chat-v1.0
101
+ - TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
102
+ - Unbabel/TowerBase-7B-v0.1
103
+ - Walmart-the-bag/Misted-v2-7B
104
+ - Walmart-the-bag/WordWoven-2x7B
105
+ - Weni/WeniGPT-2.2.3-Zephyr-7B-LLM_Base_2.0.3_SFT
106
+ - Weni/WeniGPT-2.2.3-Zephyr-7B-merged-LLM_Base_2.0.3_SFT
107
+ - Weni/WeniGPT-2.4.1-Zephyr-7B-3-epochs-GPT-QA-1.0.1_DP_DPO
108
+ - Weni/WeniGPT-2.8.1-Zephyr-7B-zephyr-prompt-binarized
109
+ - Weni/WeniGPT-Agents-Zephyr-1.0.17-KTO
110
+ - Weni/WeniGPT-Mistral-7B-instructBase
111
+ - Weni/WeniGPT-Mistral-7B-instructBase-4bit
112
+ - Weni/ZeroShot-3.3.34-Mistral-7b-Multilanguage-3.3.0-merged
113
+ - Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
114
+ - Weni/ZeroShot-Multilanguage-Zephyr-7B
115
+ - abacusai/Smaug-34B-v0.1
116
+ - abacusai/Smaug-72B-v0.1
117
  - allenai/OLMo-1B
 
118
  - allenai/OLMo-7B
119
+ - allenai/OLMo-7B-Twin-2T
120
  - allenai/tulu-2-dpo-13b
121
  - allenai/tulu-2-dpo-7b
122
  - argilla/CapybaraHermes-2.5-Mistral-7B
123
  - argilla/notus-7b-v1
124
  - argilla/notux-8x7b-v1
 
 
 
125
  - baichuan-inc/Baichuan-7B
126
  - baichuan-inc/Baichuan2-13B-Base
127
  - baichuan-inc/Baichuan2-7B-Base
128
  - bardsai/jaskier-7b-dpo-v5.6
 
129
  - berkeley-nest/Starling-LM-7B-alpha
130
  - bigscience/bloom-1b7
131
  - bigscience/bloom-3b
132
  - bigscience/bloom-560m
133
  - bigscience/bloom-7b1
 
 
 
134
  - cnmoro/Mistral-7B-Portuguese
 
 
 
135
  - croissantllm/CroissantLLMBase
 
 
 
136
  - deepseek-ai/deepseek-llm-7b-base
137
  - deepseek-ai/deepseek-moe-16b-base
138
  - deepseek-ai/deepseek-moe-16b-chat
 
142
  - dynamofl/dynamo-8B-v0.1
143
  - eduagarcia/gemma-7b-it_no_chat_template
144
  - eduagarcia/gemma-7b-it_singleturn_chat_template
 
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  - facebook/opt-1.3b
146
  - facebook/opt-125m
147
  - facebook/opt-13b
 
150
  - facebook/opt-350m
151
  - facebook/opt-6.7b
152
  - facebook/opt-66b
 
 
153
  - fernandosola/bluearara-7B
154
+ - fernandosola/bluearara-7B-instruct
 
155
  - google/gemma-1.1-2b-it
156
  - google/gemma-1.1-7b-it
 
157
  - google/gemma-2b
158
+ - google/gemma-2b-it
 
159
  - google/gemma-7b
160
+ - google/gemma-7b-it
161
  - google/mt5-base
 
 
162
  - google/mt5-small
163
+ - gpt2
164
  - h2oai/h2o-danube-1.8b-base
165
  - h2oai/h2o-danube-1.8b-chat
166
  - h2oai/h2o-danube2-1.8b-base
167
  - h2oai/h2o-danube2-1.8b-chat
 
 
 
 
 
168
  - huggyllama/llama-13b
169
  - huggyllama/llama-30b
170
  - huggyllama/llama-65b
171
  - huggyllama/llama-7b
 
 
172
  - internlm/internlm-20b
173
  - internlm/internlm-7b
174
  - internlm/internlm2-1_8b
 
177
  - internlm/internlm2-base-20b
178
  - internlm/internlm2-base-7b
179
  - internlm/internlm2-chat-1_8b
 
180
  - internlm/internlm2-chat-20b
 
 
181
  - internlm/internlm2-chat-7b
 
 
 
 
 
 
 
182
  - josu/gpt-neo-pt-1.3B
183
  - josu/gpt-neo-pt-br
184
  - lmsys/vicuna-13b-v1.5
 
186
  - lrds-code/boana-7b-instruct
187
  - lrds-code/samba-1.1B
188
  - lucianosb/boto-7B
 
 
189
  - maritaca-ai/sabia-7b
190
  - matsuo-lab/weblab-10b
 
191
  - meta-llama/Llama-2-13b-chat-hf
192
  - meta-llama/Llama-2-13b-hf
193
  - meta-llama/Llama-2-70b-chat-hf
194
  - meta-llama/Llama-2-70b-hf
195
  - meta-llama/Llama-2-7b-chat-hf
196
  - meta-llama/Llama-2-7b-hf
 
197
  - meta-llama/Meta-Llama-3-8B
198
+ - meta-llama/Meta-Llama-3-8B-Instruct
199
  - microsoft/phi-1
200
+ - microsoft/phi-1_5
201
  - microsoft/phi-2
202
  - mistral-community/Mistral-7B-v0.2
203
  - mistral-community/Mixtral-8x22B-v0.1-4bit
 
207
  - mistralai/Mixtral-8x7B-v0.1
208
  - mlabonne/Monarch-7B
209
  - monilouise/opt125M_portuguese
 
210
  - mosaicml/mpt-7b
211
+ - mosaicml/mpt-7b-8k
212
  - nicholasKluge/Aira-2-portuguese-124M
213
  - nicholasKluge/Aira-2-portuguese-1B7
214
  - nicholasKluge/Aira-2-portuguese-560M
215
  - nicholasKluge/TeenyTinyLlama-160m
 
216
  - nicholasKluge/TeenyTinyLlama-460m
217
+ - nicholasKluge/TeenyTinyLlama-460m-Chat
218
+ - nicolasdec/Cabra
219
  - nicolasdec/CabraMistral7b-0.4
 
 
 
220
  - nicolasdec/CabraQwen14b
221
  - nicolasdec/CabraQwen7b
222
+ - nicolasdec/Cabramistral7b
223
+ - nicolasdec/cabra13b
 
 
 
 
 
 
 
224
  - openai-community/gpt2-large
225
  - openai-community/gpt2-medium
226
  - openai-community/gpt2-xl
227
  - openai-community/openai-gpt
228
  - openchat/openchat-3.5-0106
 
 
229
  - openlm-research/open_llama_13b
230
  - openlm-research/open_llama_3b
231
  - openlm-research/open_llama_3b_v2
232
  - openlm-research/open_llama_7b
233
  - openlm-research/open_llama_7b_v2
 
234
  - paulml/OGNO-7B
235
  - pierreguillou/gpt2-small-portuguese
 
 
 
236
  - projecte-aina/FLOR-1.3B
237
  - projecte-aina/FLOR-6.3B
238
  - projecte-aina/FLOR-760M
239
+ - projecte-aina/aguila-7b
240
  - pucpr/gpt2-bio-pt
241
+ - recogna-nlp/GemBode-2b-it
242
+ - recogna-nlp/Phi-Bode
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
243
  - recogna-nlp/bode-13b-alpaca-pt-br
244
  - recogna-nlp/bode-7b-alpaca-pt-br
 
245
  - recogna-nlp/gembode-2b-ultraalpaca
246
  - recogna-nlp/internlmbode-7b
247
  - recogna-nlp/mistral-bode
248
  - recogna-nlp/phi-bode-2-ultraalpaca
 
 
 
 
249
  - rhaymison/Llama-portuguese-13b-Luana-v0.2
250
+ - rhaymison/Mistral-portuguese-luana-7b
 
251
  - rhaymison/Mistral-portuguese-luana-7b-Mathematics
252
+ - rhaymison/Mistral-portuguese-luana-7b-chat
253
  - rhaymison/Mistral-portuguese-luana-7b-mental-health
 
 
 
254
  - rhaymison/Qwen-portuguese-luana-7b
255
+ - rhaymison/gemma-portuguese-2b-it
256
+ - rhaymison/gemma-portuguese-luana-2b
257
  - rishiraj/CatPPT
258
+ - rishiraj/CatPPT-base
259
  - semantixai/LloroV2
 
 
260
  - stabilityai/stablelm-2-12b
261
+ - stabilityai/stablelm-2-12b-chat
 
262
  - stabilityai/stablelm-2-1_6b
263
+ - stabilityai/stablelm-2-1_6b-chat
264
  - stabilityai/stablelm-2-zephyr-1_6b
265
  - stabilityai/stablelm-3b-4e1t
 
266
  - stabilityai/stablelm-base-alpha-3b
267
+ - stabilityai/stablelm-base-alpha-3b-v2
268
  - stabilityai/stablelm-base-alpha-7b
269
+ - stabilityai/stablelm-base-alpha-7b-v2
270
  - stabilityai/stablelm-zephyr-3b
271
  - state-spaces/mamba-1.4b-hf
272
  - state-spaces/mamba-130m-hf
273
  - state-spaces/mamba-2.8b-hf
274
  - state-spaces/mamba-370m-hf
275
  - state-spaces/mamba-790m-hf
276
+ - t5-base
277
+ - t5-large
278
+ - t5-small
279
  - teknium/OpenHermes-2-Mistral-7B
280
  - teknium/OpenHermes-2.5-Mistral-7B
 
 
 
 
 
 
 
 
281
  - tiiuae/falcon-40b
282
  - tiiuae/falcon-7b
 
 
283
  - togethercomputer/RedPajama-INCITE-7B-Base
284
  - togethercomputer/RedPajama-INCITE-Base-3B-v1
 
285
  - upstage/SOLAR-10.7B-Instruct-v1.0
286
  - upstage/SOLAR-10.7B-v1.0
 
 
287
  - wandgibaut/periquito-3B
 
 
 
 
 
 
 
 
 
 
 
 
288
  - xverse/XVERSE-13B
 
289
  - xverse/XVERSE-65B
290
+ - xverse/XVERSE-65B-2
291
  - xverse/XVERSE-7B
src/display/formatting.py CHANGED
@@ -35,7 +35,7 @@ def make_clickable_model(model_name, json_path=None, revision=None):
35
  if json_path is not None:
36
  details_link = f"https://huggingface.co/datasets/{RESULTS_REPO}/blob/main/{model_name}/{json_path}"
37
 
38
- if revision is not None and revision != "main":
39
  if len(revision) > 12:
40
  revision = revision[:7]
41
  model_name += f" (rev: {revision})"
 
35
  if json_path is not None:
36
  details_link = f"https://huggingface.co/datasets/{RESULTS_REPO}/blob/main/{model_name}/{json_path}"
37
 
38
+ if revision is not None and revision != "" and revision != "main":
39
  if len(revision) > 12:
40
  revision = revision[:7]
41
  model_name += f" (rev: {revision})"
src/leaderboard/read_evals.py CHANGED
@@ -23,8 +23,8 @@ class EvalResult:
23
  org: str
24
  model: str
25
  model_sha: str # commit hash, "" if main
26
- revision: str = "main"
27
  results: dict
 
28
  precision: Precision = Precision.Unknown
29
  model_type: ModelType = ModelType.Unknown # Pretrained, fine tuned, ...
30
  weight_type: WeightType = WeightType.Original # Original or Adapter
@@ -176,12 +176,6 @@ class EvalResult:
176
  average = round(sum(average)/len(average), 2)
177
  npm = round(sum(npm)/len(npm), 2)
178
 
179
- rev_name = None
180
- if self.revision != "main":
181
- rev_name = self.revision
182
- if rev_name > 10:
183
- rev_name = rev_name[:7]
184
-
185
  data_dict = {
186
  "eval_name": self.eval_name, # not a column, just a save name,
187
  AutoEvalColumn.precision.name: self.precision.value.name,
@@ -189,7 +183,7 @@ class EvalResult:
189
  AutoEvalColumn.model_type_symbol.name: self.model_type.value.symbol,
190
  AutoEvalColumn.weight_type.name: self.weight_type.value.name,
191
  AutoEvalColumn.architecture.name: self.architecture,
192
- AutoEvalColumn.model.name: make_clickable_model(self.full_model, self.json_filename, revision=rev_name),
193
  AutoEvalColumn.dummy.name: self.full_model,
194
  AutoEvalColumn.revision.name: self.revision,
195
  AutoEvalColumn.average.name: average,
 
23
  org: str
24
  model: str
25
  model_sha: str # commit hash, "" if main
 
26
  results: dict
27
+ revision: str = "main"
28
  precision: Precision = Precision.Unknown
29
  model_type: ModelType = ModelType.Unknown # Pretrained, fine tuned, ...
30
  weight_type: WeightType = WeightType.Original # Original or Adapter
 
176
  average = round(sum(average)/len(average), 2)
177
  npm = round(sum(npm)/len(npm), 2)
178
 
 
 
 
 
 
 
179
  data_dict = {
180
  "eval_name": self.eval_name, # not a column, just a save name,
181
  AutoEvalColumn.precision.name: self.precision.value.name,
 
183
  AutoEvalColumn.model_type_symbol.name: self.model_type.value.symbol,
184
  AutoEvalColumn.weight_type.name: self.weight_type.value.name,
185
  AutoEvalColumn.architecture.name: self.architecture,
186
+ AutoEvalColumn.model.name: make_clickable_model(self.full_model, self.json_filename, revision=self.revision),
187
  AutoEvalColumn.dummy.name: self.full_model,
188
  AutoEvalColumn.revision.name: self.revision,
189
  AutoEvalColumn.average.name: average,
update_models_in_readme.py CHANGED
@@ -17,11 +17,15 @@ import glob
17
  import json
18
 
19
  snapshot_download(repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30)
 
 
 
 
 
 
20
 
 
21
  with open('model_list.txt', 'w') as fw:
22
- for filepath in glob.glob(os.path.join(EVAL_REQUESTS_PATH, '**/*.json'), recursive=True):
23
- with open(filepath, 'r') as f:
24
- model_data = json.load(f)
25
- if model_data['status'] == 'FINISHED':
26
- print(model_data['model'])
27
- fw.write(' - '+ model_data['model'] + '\n')
 
17
  import json
18
 
19
  snapshot_download(repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30)
20
+ all_models = []
21
+ for filepath in glob.glob(os.path.join(EVAL_REQUESTS_PATH, '**/*.json'), recursive=True):
22
+ with open(filepath, 'r') as f:
23
+ model_data = json.load(f)
24
+ if model_data['status'] == 'FINISHED':
25
+ all_models.append(model_data['model'])
26
 
27
+ all_models = sorted(list(set(all_models)))
28
  with open('model_list.txt', 'w') as fw:
29
+ for m in all_models:
30
+ print(m)
31
+ fw.write(' - '+ m + '\n')