Omnibus committed on
Commit
4163231
1 Parent(s): 176c5c4

Create models.py

Browse files
Files changed (1) hide show
  1. models.py +325 -0
models.py ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ models=[
2
+ "JunRyeol/jr_model",
3
+ "Delcos/internal_chat_model_e2",
4
+ "pvduy/vicuna-13b",
5
+ "master-thesis-hell/llama-7b_sft-v5",
6
+ "pvduy/vicuna-13b-v1.1",
7
+ "ArneJacob/RemiBot",
8
+ "pvduy/vicuna-13b-v1.1-sft",
9
+ "dmayhem93/llama-13b-sft-self-critiquing-base",
10
+ "dmayhem93/llama-13b-sft-self-critiquing-critique",
11
+ "dmayhem93/llama-13b-sft-self-critiquing-refine",
12
+ "dmayhem93/llama-30b-sft-self-critiquing-base",
13
+ "dmayhem93/llama-30b-sft-self-critiquing-critique",
14
+ "dmayhem93/llama-30b-sft-self-critiquing-refine",
15
+ "AlekseyKorshuk/gpt-j-6b-chatml",
16
+ "pvduy/vicuna-13b-v1.1-sft-ver2",
17
+ "DarwinAnim8or/Grug-Edge",
18
+ "Ahrefs/flan-llama-7b-delta",
19
+ "yep-search/flan-llama-7b-delta",
20
+ "xyz-nlp/XuanYuan2.0",
21
+ "gouravsinha/mpt-balance_sheet-extractor",
22
+ "alup/agrimi-lora",
23
+ "javirandor/passgpt-16characters",
24
+ "yuyuc/llama-7b-instruct-base-chem",
25
+ "vietgpt-archive/bloom-1b7-v3",
26
+ "vietgpt-archive/bloom-1b7-v3-instruction",
27
+ "meta-llama/Llama-2-7b",
28
+ "meta-llama/Llama-2-7b-chat",
29
+ "meta-llama/Llama-2-13b",
30
+ "meta-llama/Llama-2-13b-chat",
31
+ "meta-llama/Llama-2-70b",
32
+ "meta-llama/Llama-2-70b-hf",
33
+ "meta-llama/Llama-2-13b-chat-hf",
34
+ "meta-llama/Llama-2-13b-hf",
35
+ "meta-llama/Llama-2-7b-hf",
36
+ "meta-llama/Llama-2-7b-chat-hf",
37
+ "meta-llama/Llama-2-70b-chat",
38
+ "meta-llama/Llama-2-70b-chat-hf",
39
+ "vietgpt-archive/bloom-1b7-v4-legal",
40
+ "vietgpt-archive/bloom-1b7-v4-legal-instruction",
41
+ "yentinglin/Taiwan-LLaMa-v1.0-base",
42
+ "etri-lirs/egpt-1.3b-preview",
43
+ "Trelis/Llama-2-13b-chat-hf-function-calling",
44
+ "Medlinker/Medgpt",
45
+ "Medliker/Medgpt",
46
+ "dipteshkanojia/llama-2-13b-chat-hf-qe2023-multi-shuffled",
47
+ "Loke-60000/Christina-7B-chat",
48
+ "Loke-60000/Christina-7B-32K",
49
+ "Recag/1hf",
50
+ "Experimental-Models/D-Llama-2-7b-4k-3e-6-1m",
51
+ "Experimental-Models/D-Llama-2-7b-4k-3e-6-500k-epoch-1",
52
+ "Trelis/Llama-2-13b-chat-hf-function-calling-GPTQ",
53
+ "Experimental-Models/D-Llama-2-7b-4k-3e-6-500k-epoch-2",
54
+ "Experimental-Models/D-Llama-2-7b-4k-3e-6-500k-epoch-3",
55
+ "arvind2626/falcon-7b-finetuned",
56
+ "Kumail00Alawa/look-elsewhere",
57
+ "vietgpt-archive/dama-7b-92000",
58
+ "vietgpt-archive/dama-7b-100000",
59
+ "HoangCuongNguyen/llama-2-7b-CTI-research",
60
+ "Trelis/Llama-2-13b-chat-hf-function-calling-adapters-v2",
61
+ "Trelis/Llama-2-13b-chat-hf-function-calling-v2",
62
+ "pki/SecurityGPT",
63
+ "openskyml/llama-7b-chat-hf-cpu",
64
+ "sahil2801/llama-70-1",
65
+ "sahil2801/llama-70-epoch1",
66
+ "Trelis/CodeLlama-34b-Instruct-hf-function-calling-adapters-v2",
67
+ "Trelis/CodeLlama-34b-Instruct-hf-function-calling-v2",
68
+ "vietgpt-archive/hoa-7b",
69
+ "Rakeshkamma/Llama-2-7b-chat-finetune",
70
+ "bhawanisinghshekhawat/ml_llama_ft_igql",
71
+ "sahil2801/llama-70-v2",
72
+ "sekarmulyani/gpt2-ulasan-ecommerce",
73
+ "isashap/waldomodel",
74
+ "Undi95/ReML-L2-13B",
75
+ "Trelis/Llama-2-70b-chat-hf-function-calling-adapters-v2",
76
+ "Trelis/Llama-2-70b-chat-hf-function-calling-v2",
77
+ "gracenote/llama-2-7b-chat-finetuned",
78
+ "Undi95/ReMM-S-Light",
79
+ "Undi95/MLewd-L2-13B-Part3",
80
+ "Johnyquest7/Endo_Llama-2-7b",
81
+ "mariaxclarisse/familia-ensemble",
82
+ "taide/b.1.0.0",
83
+ "Undi95/ReML-v2-L2-13B",
84
+ "adityaprakhar/code_llama_service_list_1",
85
+ "Undi95/ReML-v2.1-L2-13B",
86
+ "PathOr/PathOr_LLama_70B_CHAT",
87
+ "malhajar/llama-2-70b-hf-chat-turkish-gptq",
88
+ "Undi95/MLewd-L2-Chat-13B-Old",
89
+ "PathOr/PathOr_Llama-2-70b-chat-hf-function-calling-adapters-v2",
90
+ "vietgpt/dama-2-7b",
91
+ "migueldeguzmandev/gpt2_integrated",
92
+ "Undi95/ReML-v2.2-L2-13B",
93
+ "ura-hcmut/ura-llama-7b-r64",
94
+ "pharaouk/raijin",
95
+ "vietgpt/dama-2-7b-chat",
96
+ "qqfifi/healthcare-genai-llama-sagemaker",
97
+ "BLACKBUN/llama-2-7b-pubmed-qa",
98
+ "pharaouk/zeta-3-1B",
99
+ "IrohXu/llava-llama-2-7b-maplm_lora",
100
+ "AIFS/Apollo-13B-en",
101
+ "sebastianM99/Llama-2-7b-chat-hf-romanian",
102
+ "ura-hcmut/ura-llama-7b",
103
+ "ura-hcmut/ura-llama-13b",
104
+ "ura-hcmut/ura-llama-70b",
105
+ "AIFS/Apollo-13B-pt",
106
+ "FunyTan/llama_chat",
107
+ "pphuc25/llama-1B-cultaX",
108
+ "vikp/textbook_gen6_awq",
109
+ "vikp/textbook_gen6",
110
+ "m42-health/med42-70b",
111
+ "xDAN-AI/xDAN-L1-Chat-v0.1",
112
+ "uralstech/AFO-Chat-Merged",
113
+ "pharaouk/scribe-1B",
114
+ "Trelis/Mistral-7B-Instruct-v0.1-function-calling-adapters-v2",
115
+ "Trelis/Mistral-7B-Instruct-v0.1-function-calling-v2",
116
+ "vikp/textbook_gen_mistral",
117
+ "Delcos/Alta-13b",
118
+ "pharaouk/sentinel-7B",
119
+ "arthurdubrou/Bird",
120
+ "RickBigL/gugu_mistralai_role_play_v2",
121
+ "BLACKBUN/llama-2-7b-pubmed-qa-211k",
122
+ "soumyo-at-ather/nfk4-uiz2-gr9j-0",
123
+ "BEE-spoke-data/verysmol_llama-v8-minipile_x2",
124
+ "Ashmal/ClimateGPT13B_en",
125
+ "innoverse-lab/vlm-house-v2.3",
126
+ "BLACKBUN/llama-2-7b-paediatrics-abdominal-pain",
127
+ "lilpotato03/aarons_mental_health_chatbot_v1",
128
+ "justinphan3110/Llama-2-13b-behavior_classifier",
129
+ "BLACKBUN/llama-2-7b-virtual-patient-cases",
130
+ "BLACKBUN/llama-2-7b-both",
131
+ "yixuantt/InvestLM-awq",
132
+ "Ashmal/ClimateGPT13B",
133
+ "nctu6/MOE-AICUP-Training-7B",
134
+ "ranchlai/Baichuan2-13B-Chat-gptq-4bit-32g",
135
+ "Trelis/falcon-7b-chat-SFT",
136
+ "jin05102518/Astral-7B-0.5Epoch-Test",
137
+ "Delcos/Nate-70b-DeepN-Healthtune",
138
+ "Trelis/deepseek-coder-6.7b-instruct-function-calling-adapters-v2",
139
+ "Trelis/deepseek-coder-6.7b-instruct-function-calling-v2",
140
+ "Trelis/deepseek-coder-1.3b-instruct-function-calling-adapters-v2",
141
+ "Trelis/deepseek-coder-1.3b-instruct-function-calling-v2",
142
+ "Trelis/deepseek-coder-33b-instruct-function-calling-adapters-v2",
143
+ "Trelis/deepseek-coder-33b-instruct-function-calling-v2",
144
+ "Yeshwanth-03-06-2004/llama2-7b-hf-small-biogen",
145
+ "asmaa-ali/llama-2-7b-AsmaaChemProt",
146
+ "Trelis/zephyr-7b-beta-function-calling-v2",
147
+ "sowrensen/quipbot-llama-2-7b-chat-hf",
148
+ "sowrensen/quipbot-llama-2-7b-hf",
149
+ "xDAN-AI/xDAN-L2-Chat-Performance-e2",
150
+ "mayuanyang/llama-2-7b-hi200-faq",
151
+ "Trelis/falcon-40B-chat-SFT",
152
+ "SrikanthChellappa/mistral-7b-sharded-finetuning-medical100k-chatbot",
153
+ "JosephVit/llama2_research_healthvar",
154
+ "SrikanthChellappa/llama2-7b-sharded-finetuning-medical100k-chatbot",
155
+ "Trelis/TinyLlama-1.1B-4k-chat-SFT-DPO",
156
+ "SrikanthChellappa/falcon-7b-sharded-finetuning-medical100k-chatbot",
157
+ "nvidia/nemotron-3-8b-base-4k",
158
+ "nvidia/nemotron-3-8b-chat-4k-rlhf",
159
+ "nvidia/nemotron-3-8b-chat-4k-sft",
160
+ "nvidia/nemotron-3-8b-chat-4k-steerlm",
161
+ "nvidia/nemotron-3-8b-qa-4k",
162
+ "Yeshwanth-03-06-2004/gpt2-tweetgen",
163
+ "Trelis/Yi-6B-200K-Llamafied-function-calling-adapters-v2",
164
+ "Trelis/Yi-6B-200K-Llamafied-function-calling-v2",
165
+ "Trelis/Yi-34B-200K-Llamafied-function-calling-adapters-v2",
166
+ "Trelis/Yi-6B-200K-Llamafied-chat-SFT",
167
+ "vietgpt/dama-2-7b-chat-gguf",
168
+ "xDAN-AI/xDAN-L1Mix-DeepThinking-v2",
169
+ "Trelis/Yi-6B-200K-Llamafied-chat-SFT-AWQ",
170
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT-AWQ",
171
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT",
172
+ "BLACKBUN/llama-2-13b-virtual-patient-cases",
173
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT-function-calling-v2",
174
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT-function-calling-v2-AWQ",
175
+ "BLACKBUN/llama-2-13b-paediatrics-abdominal-pain",
176
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT-function-calling-v2-GPTQ",
177
+ "BLACKBUN/llama-2-13b-both",
178
+ "SrikanthChellappa/orca2-7b-sharded-finetuning-medical100k-chatbot",
179
+ "stabilityai/StableLM_exp1",
180
+ "taide/b.11.0.0",
181
+ "Lithicsoft/The-Lithicsoft-Research-AI-02",
182
+ "ishaansharma/llama_test_tiny_ola_hindi",
183
+ "stabilityai/StableLM_exp3",
184
+ "dongnguyen18891/zephyr-7b-beta-vi-math",
185
+ "BaoLocTown/sft-zephyr-7b-beta-v3",
186
+ "BaoLocTown/sft-zephyr-7b-beta-v4",
187
+ "deepnight-research/ai1",
188
+ "DopeorNope/mistralopithecus-v1-SFT-7b",
189
+ "DopeorNope/mistralopithecus-v3-dpo-7b",
190
+ "HumanF-MarkrAI/COKAL-DPO-13b-v3",
191
+ "fblgit/juanako-7b-UNA-v2-phase-1",
192
+ "izayashiro/mistralai-HPC-Instruct",
193
+ "Devden/Debt-agent-2",
194
+ "Trelis/em_german_leo_mistral-function-calling-v2",
195
+ "HumanF-MarkrAI/Dear_My_best_Friends-v4-13B",
196
+ "MarkrAI/DopeorNope-Maestro-v1-13B",
197
+ "snunlp/bok_finance_model_1129",
198
+ "MarkrAI/DopeorNope-maestro-v1-DPO-13b",
199
+ "MarkrAI/DopeorNope-maestro-v1.1-DPO-13b",
200
+ "MarkrAI/DopeorNope-maestro-v2-DPO-13b",
201
+ "imone/openchat_3.5_Yi_6B",
202
+ "MarkrAI/DopeorNope-maestro-v4-DPO-13b",
203
+ "Trelis/Mistral-7B-Instruct-v0.1-function-calling-v3",
204
+ "jeffzyu/llama-2-7b-chat-profit",
205
+ "wons/Yi-6b-test-v0.1",
206
+ "Trelis/openchat_3.5-function-calling-v3",
207
+ "vilm/vinallama-hermes-small",
208
+ "hclaim/clamgpt7",
209
+ "snunlp/bok_finance_llama",
210
+ "Jiahuan/vox-finetune-llama-2-7b-chat",
211
+ "V1v3c/falconX",
212
+ "Trelis/Yi-34B-200K-Llamafied-chat-SFT-function-calling-v3",
213
+ "Trelis/deepseek-llm-67b-chat-function-calling-v3",
214
+ "one-man-army/una-cybertron-14b-v2-bf16",
215
+ "solakim/Mistral-Sierra-Instruct",
216
+ "meta-llama/LlamaGuard-7b",
217
+ "Hjallti/solar-strike-0",
218
+ "shwesk/mlops_mistral-7b-Instruct-GPTQ",
219
+ "Prashanthch/llama-2-7b",
220
+ "HighClassShawty/DEV1L-V1",
221
+ "Trelis/Mistral-7B-Instruct-v0.1-Summarize-64k",
222
+ "xDAN2099/xDAN-L1M-Mixtral-experts-e1",
223
+ "taozi555/T-dpo-step300",
224
+ "Trelis/Mistral-7B-Instruct-v0.2-function-calling-v3",
225
+ "Trelis/SUS-Chat-34B-function-calling-v3",
226
+ "miweru/ochat3-5_schwurpus_merged",
227
+ "yixuantt/InvestLM-33b-awq",
228
+ "liuyongq/eval_model_tmp",
229
+ "ura-hcmut/MixSUra",
230
+ "Trelis/Mixtral-8x7B-Instruct-v0.1-function-calling-v3",
231
+ "bi-matrix/g-matrix-mx7b",
232
+ "Trelis/DeciLM-7B-instruct-function-calling-v3",
233
+ "solakim/Mistral-Mike-Instruct",
234
+ "xDAN-AI/xDAN-L1-moe-4x7b",
235
+ "xDAN-AI/xDAN-L2-Chat-RL-v2",
236
+ "Mitsuki-Sakamoto/pythia-1.4b_alpaca_farm_instructions_sft_constant_pa",
237
+ "xDAN-AI/xDAN-L1-Chat-RL-v1-awq",
238
+ "Trelis/deepseek-coder-33b-instruct-function-calling-v3",
239
+ "thanhdath/vinallama-7b-legal-chat",
240
+ "msy127/mnsim-sft-peftmerged",
241
+ "xDAN-AI/xDAN-L1-SOLAR-RL-v1",
242
+ "xDAN-AI/xDAN-L1-moe-8x7b",
243
+ "PDScience/CollegeAuditScraper_v1.0",
244
+ "Trelis/Tiny",
245
+ "pran1805/BloomFinance",
246
+ "pran1805/FalconFinance",
247
+ "ura-hcmut/MixSUra-AWQ",
248
+ "LolaLaiser/LOTTE_CHAT",
249
+ "SakuraLLM/Sakura-13B-Base-v0.9.0",
250
+ "lo0on/demo",
251
+ "iarbel/law-chat-base",
252
+ "pran1805/MistralFinance",
253
+ "justinj92/dpoplatypus-phi2",
254
+ "johaness14/BLOOM_161M_French",
255
+ "rexionmars/mistral_essay_evaluator",
256
+ "yentinglin/Taiwan-LLM-MoE-alpha",
257
+ "JoshVictor/llama-2-7b-chat-hf-TEL-ERW",
258
+ "margenai/Llama-2-7b-ecommerce-chat-hf",
259
+ "abhinand/tamil-mistral-sft-alpha-v0",
260
+ "thanhdath/c-7b-legal-chat",
261
+ "fblgit/UNA-34Beagles-32K-v1",
262
+ "iarbel/mistral-sft-lora_v3_all",
263
+ "KSU-HW-SEC/Finetune-qv-in-30k_model-5epoch",
264
+ "Trelis/Mixtral-8x7B-Instruct-v0.1-writer-assistant-inline-v0.12-fullmodel",
265
+ "Kwabena/misteralInstruct_V2",
266
+ "Gincy/mistral-7b-finetune",
267
+ "hditnh57/llama2-13b-chat-hf-trained",
268
+ "KavyaSwethaJ/Yazh",
269
+ "Harry-woolnough/mistrueue",
270
+ "jingyeom/translation_solar_shargpt",
271
+ "beomi/Yi-Ko-34B-dev",
272
+ "Trelis/CodeLlama-70b-Instruct-hf-function-calling-v3",
273
+ "nctu6/c.1.0.0",
274
+ "nctu6/e.1.0.0",
275
+ "jingyeom/translation_solar_shargpt_koen",
276
+ "iNeil77/IRCoder-1_1b",
277
+ "iNeil77/IRCoder-3_1b",
278
+ "iNeil77/IRCoder-6_7b",
279
+ "anik115/fine-tune-llama-7b",
280
+ "vilm/Quyen-SE-4e",
281
+ "vilm/Quyen-4e",
282
+ "wisdomik/Quilt-Llava-v1.5-7b",
283
+ "vilm/Quyen-Mini-4e",
284
+ "adarshxs/Telugu-SFT-merged",
285
+ "KrispNut/Chat-Bot",
286
+ "iNeil77/IRCoder-7_3b",
287
+ "iNeil77/IRCoder-1_3b",
288
+ "jingyeom/translation_solar_shargpt_koen_conversation",
289
+ "jingyeom/translate_conversation_shargpt_solar_koen",
290
+ "iNeil77/IRCoder-5_7b",
291
+ "iNeil77/IRCoder-6_7b-instruct",
292
+ "iNeil77/IRCoder-1_1b-instruct",
293
+ "iNeil77/IRCoder-3_1b-instruct",
294
+ "iNeil77/IRCoder-1_3b-instruct",
295
+ "iNeil77/IRCoder-5_7b-instruct",
296
+ "iNeil77/IRCoder-7_3b-instruct",
297
+ "google/gemma-2b",
298
+ "google/gemma-2b-it",
299
+ "google/gemma-7b",
300
+ "marcu5fen1x/llama_2_commaVQ",
301
+ "HeavenWaters/TaxTajweezLlama7B",
302
+ "plainbagel/RedFox-7B-v0.4-rc3",
303
+ "plainbagel/RedFox-6B-v0.4-rc5",
304
+ "Gincy/mistral7b-finetuned-second-llm",
305
+ "stmld/pgpt_mistral_7b",
306
+ "google/gemma-7b-it",
307
+ "AIFS/Prometh-MOEM-V.01",
308
+ "rockyclh/llama2_7b_hf_entrepreneurship",
309
+ "abhishekchohan/SOLAR-10.7B-Instruct-Forest-DPO-v1",
310
+ "plainbagel/RedFox-10.7B-v0.4-rc4",
311
+ "plainbagel/RedFox-13B-v0.4-rc1",
312
+ "plainbagel/RedFox-10.7B-v0.4-rc2",
313
+ "DrFumes/true-ANNE-7b-bf16",
314
+ "ura-hcmut/MixSUra-SFT",
315
+ "nagyroland/ANNE-7b-bf16-cmh",
316
+ "ura-hcmut/MixSUra-SFT-AWQ",
317
+ "almersawi/fine-tuning-test-01",
318
+ "AA051615/A0221",
319
+ "AA051615/A0222",
320
+ "pphuc25/poem-vistral",
321
+ "oi-uae/bert-classification-v-1",
322
+ "ura-hcmut/GemSUra-7B",
323
+ "johaness14/GPT2-54.5M-OpenWebText100K",
324
+ "ura-hcmut/GemSUra-2B"
325
+ ]