Spaces:
Runtime error
Runtime error
def return_task_name(): | |
return ('text2text-generation', "text-generation") | |
def return_models(task_name): | |
if task_name == "text2text-generation": | |
models_parent = ( | |
'google', | |
"facebook", | |
"microsoft", | |
"salesforce", | |
"langboat", | |
"bloom", | |
"allenai", | |
"mbzuai", | |
"lmsys", | |
"starmpcc", | |
"haining", | |
"kaludi", | |
) | |
else: | |
models_parent = ( | |
'google', | |
"facebook", | |
"microsoft", | |
"salesforce", | |
"langboat", | |
"databricks", | |
"aisquared", | |
"bloom", | |
"allenai", | |
"tiiuae", | |
"openlm", | |
"stabilityai", | |
"eleutherai", | |
"mbzuai", | |
"cerebras", | |
"open_assistant", | |
"nomic_ai", | |
"blinkdl", | |
"lmsys", | |
"together_computer", | |
"mosaic_ml", | |
"h20ai", | |
"deciai", | |
) | |
return models_parent | |
def return_text2text_generation_models(model_parent, count=False): | |
google_models_list = ( | |
"google/flan-t5-small", | |
"google/flan-t5-base", | |
'google/flan-t5-large', | |
'google/flan-t5-xl', | |
'google/flan-t5-xxl', | |
"google/byt5-xxl", | |
"google/byt5-xl", | |
"google/byt5-large", | |
"google/byt5-small", | |
"google/byt5-base", | |
"google/mt5-xxl", | |
"google/mt5-xl", | |
"google/mt5-large", | |
"google/mt5-small", | |
"google/long-t5-local-base", | |
"google/long-t5-local-large", | |
"google/long-t5-tglobal-base", | |
"google/long-t5-tglobal-large", | |
"google/pegasus-big_patent", | |
"google/pegasus-x-base", | |
"google/pegasus-x-large", | |
"google/pegasus-x-base-arxiv", | |
"google/roberta2roberta_L-24_wikisplit", | |
"google/roberta2roberta_L-24_discofuse", | |
"google/switch-base-8", | |
"google/switch-base-16", | |
"google/switch-base-32", | |
"google/switch-base-64", | |
"google/switch-base-128", | |
"google/switch-base-256", | |
"google/switch-large-128", | |
"google/switch-xxl-128", | |
"google/switch-c-2048", | |
"google/t5-11b-ssm", | |
"google/t5-11b-ssm-nq", | |
"google/t5-11b-ssm-nqo", | |
"google/t5-11b-ssm-tqa", | |
"google/t5-11b-ssm-tqao", | |
"google/t5-11b-ssm-wq", | |
"google/t5-11b-ssm-wqo", | |
"google/t5-3b-ssm", | |
"google/t5-3b-ssm-nq", | |
"google/t5-3b-ssm-nqo", | |
"google/t5-base-lm-adapt", | |
"google/t5-base-lm-adapt", | |
"google/t5-efficient-base", | |
"google/t5-efficient-base-dl2", | |
"google/t5-efficient-base-dl4", | |
"google/t5-efficient-base-dl6", | |
"google/t5-efficient-base-dl8", | |
"google/t5-efficient-base-dm256", | |
"google/t5-efficient-base-dm512", | |
"google/t5-efficient-base-dm1000", | |
"google/t5-efficient-base-dm2000", | |
"google/t5-efficient-base-el2", | |
"google/t5-efficient-base-el4", | |
"google/t5-efficient-base-el6", | |
"google/t5-efficient-base-el8", | |
"google/t5-efficient-base-el16", | |
"google/t5-efficient-base-nl40", | |
"google/t5-efficient-base-nl48", | |
"google/t5-efficient-base-nl8", | |
"google/t5-efficient-large", | |
"google/t5-efficient-large-dl12", | |
"google/t5-efficient-large-dl16", | |
"google/t5-efficient-large-dl2", | |
"google/t5-efficient-large-dl32", | |
"google/t5-efficient-large-dl4", | |
"google/t5-efficient-large-dl6", | |
"google/t5-efficient-large-dl8", | |
"google/t5-efficient-large-dm128", | |
"google/t5-efficient-large-dm2000", | |
"google/t5-efficient-large-dm256", | |
"google/t5-efficient-large-dm512", | |
"google/t5-efficient-large-dm768", | |
"google/t5-efficient-large-el12", | |
"google/t5-efficient-large-el2", | |
"google/t5-efficient-large-el4", | |
"google/t5-efficient-large-el6", | |
"google/t5-efficient-large-el8", | |
"google/t5-efficient-large-kv128", | |
"google/t5-efficient-large-kv16", | |
"google/t5-efficient-large-kv256", | |
"google/t5-efficient-large-kv32", | |
"google/t5-efficient-large-nh12", | |
"google/t5-efficient-large-nh2", | |
"google/t5-efficient-large-nh24", | |
"google/t5-efficient-large-nh32", | |
"google/t5-efficient-large-nh4", | |
"google/t5-efficient-large-nh8", | |
"google/t5-efficient-large-nh8-nl32", | |
"google/t5-efficient-large-nl10", | |
"google/t5-efficient-large-nl12", | |
"google/t5-efficient-large-nl16", | |
"google/t5-efficient-large-nl2", | |
"google/t5-efficient-large-nl20", | |
"google/t5-efficient-large-nl32", | |
"google/t5-efficient-large-nl36", | |
"google/t5-efficient-large-nl4", | |
"google/t5-efficient-large-nl8", | |
"google/t5-efficient-mini", | |
"google/t5-efficient-mini-nl12", | |
"google/t5-efficient-mini-nl24", | |
"google/t5-efficient-mini-nl6", | |
"google/t5-efficient-mini-nl8", | |
"google/t5-efficient-small", | |
"google/t5-efficient-small-dl12", | |
"google/t5-efficient-small-dl16", | |
"google/t5-efficient-small-dl2", | |
"google/t5-efficient-small-dl4", | |
"google/t5-efficient-small-dl8", | |
"google/t5-efficient-small-dm1000", | |
"google/t5-efficient-small-dm128", | |
"google/t5-efficient-small-dm2000", | |
"google/t5-efficient-small-dm256", | |
"google/t5-efficient-small-dm768", | |
"google/t5-efficient-small-el12", | |
"google/t5-efficient-small-el16", | |
"google/t5-efficient-small-el16-dl1", | |
"google/t5-efficient-small-el16-dl2", | |
"google/t5-efficient-small-el16-dl4", | |
"google/t5-efficient-small-el16-dl8", | |
"google/t5-efficient-small-el2", | |
"google/t5-efficient-small-el32", | |
"google/t5-efficient-small-el4", | |
"google/t5-efficient-small-el48", | |
"google/t5-efficient-small-el64", | |
"google/t5-efficient-small-el8", | |
"google/t5-efficient-small-el8-dl1", | |
"google/t5-efficient-small-el8-dl2", | |
"google/t5-efficient-small-el8-dl4", | |
"google/t5-efficient-small-ff1000", | |
"google/t5-efficient-small-ff12000", | |
"google/t5-efficient-small-ff3000", | |
"google/t5-efficient-small-ff6000", | |
"google/t5-efficient-small-ff9000", | |
"google/t5-efficient-small-kv128", | |
"google/t5-efficient-small-kv16", | |
"google/t5-efficient-small-kv256", | |
"google/t5-efficient-small-kv32", | |
"google/t5-efficient-small-nl16", | |
"google/t5-efficient-small-nl2", | |
"google/t5-efficient-small-nl20", | |
"google/t5-efficient-small-nl22", | |
"google/t5-efficient-small-nl24", | |
"google/t5-efficient-small-nl32", | |
"google/t5-efficient-small-nl36", | |
"google/t5-efficient-small-nl4", | |
"google/t5-efficient-small-nl40", | |
"google/t5-efficient-small-nl48", | |
"google/t5-efficient-small-nl8", | |
"google/t5-efficient-tiny", | |
"google/t5-efficient-tiny-dl2", | |
"google/t5-efficient-tiny-dl6", | |
"google/t5-efficient-tiny-dl8", | |
"google/t5-efficient-tiny-el12", | |
"google/t5-efficient-tiny-el2", | |
"google/t5-efficient-tiny-el6", | |
"google/t5-efficient-tiny-el8", | |
"google/t5-efficient-tiny-ff12000", | |
"google/t5-efficient-tiny-ff2000", | |
"google/t5-efficient-tiny-ff3000", | |
"google/t5-efficient-tiny-ff6000", | |
"google/t5-efficient-tiny-ff9000", | |
"google/t5-efficient-tiny-nh1", | |
"google/t5-efficient-tiny-nh16", | |
"google/t5-efficient-tiny-nh32", | |
"google/t5-efficient-tiny-nh8", | |
"google/t5-efficient-tiny-nl12", | |
"google/t5-efficient-tiny-nl16", | |
"google/t5-efficient-tiny-nl2", | |
"google/t5-efficient-tiny-nl24", | |
"google/t5-efficient-tiny-nl32", | |
"google/t5-efficient-tiny-nl6", | |
"google/t5-efficient-tiny-nl8", | |
"google/t5-efficient-xl", | |
"google/t5-efficient-xl-nl12", | |
"google/t5-efficient-xl-nl16", | |
"google/t5-efficient-xl-nl2", | |
"google/t5-efficient-xl-nl28", | |
"google/t5-efficient-xl-nl4", | |
"google/t5-efficient-xl-nl6", | |
"google/t5-efficient-xl-nl8", | |
"google/t5-efficient-xxl", | |
"google/t5-efficient-xxl-nl4", | |
"google/t5-large-lm-adapt", | |
"google/t5-large-ssm", | |
"google/t5-large-ssm-nq", | |
"google/t5-large-ssm-nqo", | |
"google/t5-small-lm-adapt", | |
"google/t5-small-ssm", | |
"google/t5-small-ssm-nq", | |
"google/t5-v1_1-base", | |
"google/t5-v1_1-large", | |
"google/t5-v1_1-small", | |
"google/t5-v1_1-xl", | |
"google/t5-v1_1-xxl", | |
"google/t5-xl-lm-adapt", | |
"google/t5-xl-ssm-nq", | |
"google/t5-xxl-lm-adapt", | |
"google/t5-xxl-ssm", | |
"google/t5-xxl-ssm-nq", | |
"google/t5-xxl-ssm-nqo", | |
"google/t5-xxl-ssm-tqa", | |
"google/t5-xxl-ssm-tqao", | |
"google/t5-xxl-ssm-wq", | |
"google/t5-xxl-ssm-wqo", | |
"google/t5_11b_trueteacher_and_anli", | |
"google/ul2", | |
"google/umt5-base", | |
"google/umt5-small", | |
"google/umt5-xl", | |
"google/umt5-xxl", | |
) | |
mbzuai_models_list = ( | |
"MBZUAI/LaMini-Flan-T5-783M", | |
"MBZUAI/LaMini-Flan-T5-248M", | |
"MBZUAI/LaMini-Flan-T5-77M", | |
"MBZUAI/LaMini-T5-738M", | |
"MBZUAI/LaMini-T5-223M", | |
"MBZUAI/LaMini-T5-61M", | |
) | |
bloom_models_list = ( | |
"bigscience/T0_3B", | |
"bigscience/T0_original_task_only", | |
"bigscience/T0_single_prompt", | |
"bigscience/T0p", | |
"bigscience/T0", | |
"bigscience/T0pp", | |
"bigscience/mt0-xxl-p3", | |
"bigscience/mt0-xxl", | |
"bigscience/mt0-large", | |
"bigscience/mt0-base", | |
"bigscience/mt0-small", | |
"bigscience/mt0-xxl-mt", | |
) | |
lmsys_models_list = ( | |
"lmsys/fastchat-t5-3b-v1.0", | |
) | |
facebook_models_list = ( | |
'facebook/mbart-large-50-many-to-many-mmt', | |
'facebook/musicgen-small', | |
'facebook/musicgen-medium', | |
"facebook/musicgen-large", | |
'facebook/m2m100_418M', | |
'facebook/mbart-large-50-one-to-many-mmt', | |
'facebook/mbart-large-50-many-to-one-mmt', | |
'facebook/mbart-large-50', | |
'facebook/mgenre-wiki', | |
'facebook/genre-linking-aidayago2', | |
'facebook/genre-linking-blink', | |
'facebook/genre-kilt', | |
'facebook/m2m100-12B-avg-10-ckpt', | |
'facebook/m2m100-12B-avg-5-ckpt', | |
'facebook/m2m100-12B-last-ckpt', | |
'facebook/m2m100_1.2B' | |
) | |
microsoft_models_list = ( | |
"microsoft/prophetnet-large-uncased", | |
"microsoft/codereviewer", | |
"microsoft/xprophetnet-large-wiki100-cased", | |
"microsoft/xprophetnet-large-wiki100-cased-xglue-qg", | |
"microsoft/xprophetnet-large-wiki100-cased-xglue-ntg", | |
"microsoft/prophetnet-large-uncased-squad-qg", | |
"microsoft/prophetnet-large-uncased-cnndm", | |
) | |
starmpcc_models_list = ( | |
"starmpcc/Asclepius-13B", | |
"starmpcc/Asclepius-7B" | |
) | |
langboat_models_list = ( | |
"Langboat/mengzi-t5-base", | |
"Langboat/mengzi-t5-base-mt" | |
) | |
haining_models_list = ( | |
"haining/scientific_abstract_simplification", | |
"haining/poem_interpretation_allpoetry169k_baseline", | |
"haining/poem_interpretation_allpoetry169k_full", | |
"haining/lyrics_interpretation_nonnegative", | |
"haining/poem_interpretation_allpoetry169k", | |
"haining/sas_baseline", | |
) | |
kaludi_models_list = ( | |
"Kaludi/chatgpt-gpt4-prompts-bart-large-cnn-samsum", | |
"Kaludi/Customer-Support-Assistant", | |
"Kaludi/Customer-Support-Assistant-V2", | |
"Kaludi/historical-events-reimagined" | |
) | |
allenai_models_list = ( | |
'allenai/macaw-large', | |
'allenai/entailer-11b', | |
'allenai/entailer-large', | |
'allenai/System4_classify_FigLang2022', | |
'allenai/System4_explain_FigLang2022', | |
'allenai/System3_DREAM_FLUTE_all_dimensions_FigLang2022', | |
'allenai/System3_DREAM_FLUTE_social_norm_FigLang2022', | |
'allenai/System3_DREAM_FLUTE_consequence_FigLang2022', | |
'allenai/System3_DREAM_FLUTE_motivation_FigLang2022', | |
'allenai/System3_DREAM_FLUTE_emotion_FigLang2022', | |
'allenai/System2_FigLang2022', | |
'allenai/System1_FigLang2022', | |
'allenai/DREAM', | |
'allenai/led-base-16384-cochrane', | |
'allenai/bart-large-multi_lexsum-long-multitask', | |
'allenai/bart-large-multi_lexsum-source-multitask', | |
'allenai/pegasus-multi_lexsum-short-tiny', | |
'allenai/pegasus-multi_lexsum-long-tiny', | |
'allenai/pegasus-multi_lexsum-long-short', | |
'allenai/bart-large-multi_lexsum-short-tiny', | |
'allenai/bart-large-multi_lexsum-long-tiny', | |
'allenai/bart-large-multi_lexsum-long-short', | |
'allenai/primera-multi_lexsum-source-tiny', | |
'allenai/primera-multi_lexsum-source-short', | |
'allenai/primera-multi_lexsum-source-long', | |
'allenai/led-base-16384-multi_lexsum-source-tiny', | |
'allenai/led-base-16384-multi_lexsum-source-short', | |
'allenai/led-base-16384-multi_lexsum-source-long', | |
'allenai/led-base-16384-ms2', | |
'allenai/mtk-instruct-11b-def-pos', | |
'allenai/tk-instruct-small-def-pos', | |
'allenai/tk-instruct-base-def-pos', | |
'allenai/tk-instruct-large-def-pos', | |
'allenai/mtk-instruct-3b-def-pos', | |
'allenai/tk-instruct-3b-def-pos-neg-expl', | |
'allenai/tk-instruct-3b-def-pos-neg', | |
'allenai/tk-instruct-3b-pos', | |
'allenai/tk-instruct-3b-def-pos', | |
'allenai/tk-instruct-3b-def', | |
'allenai/tk-instruct-11b-def-pos-neg-expl', | |
'allenai/tk-instruct-11b-def-pos', | |
'allenai/tk-instruct-11b-def', | |
'allenai/PRIMERA-arxiv', | |
'allenai/PRIMERA-wcep', | |
'allenai/PRIMERA-multixscience', | |
'allenai/PRIMERA-multinews', | |
'allenai/PRIMERA', | |
'allenai/unifiedqa-v2-t5-small-1363200', | |
'allenai/unifiedqa-v2-t5-small-1251000', | |
'allenai/unifiedqa-v2-t5-large-1363200', | |
'allenai/unifiedqa-v2-t5-large-1251000', | |
'allenai/unifiedqa-v2-t5-base-1363200', | |
'allenai/unifiedqa-v2-t5-base-1251000', | |
'allenai/unifiedqa-v2-t5-3b-1363200', | |
'allenai/unifiedqa-v2-t5-3b-1251000', | |
'allenai/unifiedqa-v2-t5-11b-1363200', | |
'allenai/unifiedqa-v2-t5-11b-1251000', | |
'allenai/unifiedqa-t5-small', | |
'allenai/unifiedqa-t5-large', | |
'allenai/unifiedqa-t5-base', | |
'allenai/unifiedqa-t5-3b', | |
'allenai/unifiedqa-t5-11b', | |
'allenai/tailor', | |
'allenai/t5-small-squad2-question-generation', | |
'allenai/t5-small-squad2-next-word-generator-squad', | |
'allenai/t5-small-squad11', | |
'allenai/t5-small-next-word-generator-qoogle', | |
'allenai/macaw-answer-11b', | |
'allenai/macaw-3b', | |
'allenai/macaw-11b', | |
'allenai/led-large-16384', | |
'allenai/led-large-16384-arxiv', | |
'allenai/led-base-16384' | |
) | |
salesforce_models_list = ( | |
'Salesforce/socratic-books-30M', | |
'Salesforce/instructcodet5p-16b', | |
'Salesforce/codet5p-2b', | |
'Salesforce/codet5p-6b', | |
'Salesforce/codet5p-16b', | |
'Salesforce/dialogstudio-t5-3b-v1.0', | |
'Salesforce/dialogstudio-t5-base-v1.0', | |
'Salesforce/dialogstudio-t5-large-v1.0', | |
'Salesforce/bart-large-xsum-samsum', | |
'Salesforce/cods-bart-large-xsum-samsum', | |
'Salesforce/qaconv-unifiedqa-t5-3b', | |
'Salesforce/qaconv-unifiedqa-t5-base', | |
'Salesforce/qaconv-unifiedqa-t5-large', | |
'Salesforce/mixqg-base', | |
'Salesforce/mixqg-3b', | |
'Salesforce/mixqg-large', | |
'Salesforce/codet5-small', | |
'Salesforce/codet5-base', | |
'Salesforce/codet5-large', | |
'Salesforce/codet5-large-ntp-py', | |
'Salesforce/codet5-base-multi-sum', | |
'Salesforce/discord_qg', | |
'Salesforce/codet5-base-codexglue-sum-python', | |
'Salesforce/codet5-base-codexglue-sum-go', | |
'Salesforce/codet5-base-codexglue-sum-php', | |
'Salesforce/codet5-base-codexglue-sum-javascript', | |
'Salesforce/codet5-base-codexglue-sum-java', | |
'Salesforce/codet5-base-codexglue-sum-ruby', | |
'Salesforce/codet5-base-codexglue-clone', | |
'Salesforce/codet5-base-codexglue-concode', | |
'Salesforce/codet5-base-codexglue-defect', | |
'Salesforce/codet5-base-codexglue-refine-medium', | |
'Salesforce/codet5-base-codexglue-refine-small', | |
'Salesforce/codet5-base-codexglue-translate-cs-java', | |
'Salesforce/codet5-base-codexglue-translate-java-cs', | |
'Salesforce/safety-flan-t5-base', | |
'Salesforce/safety-flan-t5-small', | |
'Salesforce/codet5p-770m-py', | |
'Salesforce/codet5p-770m', | |
'Salesforce/codet5p-220m', | |
'Salesforce/codet5p-220m-py', | |
'Salesforce/bart-large-swipe', | |
'Salesforce/bart-large-swipe-clean' | |
) | |
model_dict = { | |
"google": google_models_list, | |
"mbzuai": mbzuai_models_list, | |
"bloom": bloom_models_list, | |
"lmsys": lmsys_models_list, | |
"facebook": facebook_models_list, | |
"microsoft": microsoft_models_list, | |
"starmpcc": starmpcc_models_list, | |
"langboat": langboat_models_list, | |
"haining": haining_models_list, | |
"kaludi": kaludi_models_list, | |
"allenai": allenai_models_list, | |
"salesforce": salesforce_models_list | |
} | |
if count is True: | |
models_count = 0 | |
for i in model_dict: | |
models_count += len(model_dict[i]) | |
return models_count | |
return model_dict[model_parent] | |
# Text Generation Models | |
def return_text_generation_models(model_parent, count=False): | |
google_models_list = ( | |
"google/reformer-enwik8", | |
"google/reformer-crime-and-punishment", | |
) | |
mbzuai_models_list = ( | |
"MBZUAI/LaMini-Cerebras-111M", | |
"MBZUAI/LaMini-Cerebras-256M", | |
"MBZUAI/LaMini-Cerebras-590M", | |
"MBZUAI/LaMini-Cerebras-1.3B", | |
"MBZUAI/LaMini-GPT-774M", | |
"MBZUAI/LaMini-GPT-124M", | |
"MBZUAI/LaMini-GPT-1.5B", | |
"MBZUAI/LaMini-Neo-125M", | |
"MBZUAI/LaMini-Neo-1.3B", | |
) | |
eleutherai_models_list=( | |
"EleutherAI/pythia-14m", | |
"EleutherAI/pythia-31m", | |
"EleutherAI/pythia-1b-deduped", | |
"EleutherAI/pythia-2.8b-v0", | |
"EleutherAI/pythia-1b-v0", | |
"EleutherAI/pythia-410m-v0", | |
"EleutherAI/pythia-70m-deduped-v0", | |
"EleutherAI/pythia-2.8b-deduped-v0", | |
"EleutherAI/pythia-1b-deduped-v0", | |
"EleutherAI/pythia-410m-deduped-v0", | |
"EleutherAI/pythia-160m-deduped-v0", | |
"EleutherAI/pythia-6.9b-deduped-v0", | |
"EleutherAI/pythia-70m-deduped", | |
"EleutherAI/pythia-70m", | |
"EleutherAI/pythia-2.8b-deduped", | |
"EleutherAI/pythia-1b", | |
"EleutherAI/pythia-410m-deduped", | |
"EleutherAI/pythia-160m-deduped", | |
"EleutherAI/pythia-160m-v0", | |
"EleutherAI/pythia-1.4b-deduped-v0", | |
"EleutherAI/pythia-1.4b", | |
"EleutherAI/pythia-410m", | |
"EleutherAI/pythia-intervention-410m-deduped", | |
"EleutherAI/gpt-neo-125m", | |
"EleutherAI/gpt-neo-2.7B", | |
"EleutherAI/gpt-neo-1.3B", | |
"EleutherAI/pythia-160m", | |
"EleutherAI/gpt-neox-20b", | |
"EleutherAI/gpt-j-6b", | |
"EleutherAI/pythia-2.8b", | |
"EleutherAI/pythia-12b-deduped", | |
"EleutherAI/pythia-6.9b-deduped", | |
"EleutherAI/pythia-1.4b-deduped", | |
"EleutherAI/pythia-12b", | |
"EleutherAI/pythia-6.9b", | |
"EleutherAI/polyglot-ko-12.8b", | |
"EleutherAI/polyglot-ko-5.8b", | |
"EleutherAI/polyglot-ko-3.8b", | |
"EleutherAI/polyglot-ko-1.3b", | |
"EleutherAI/pythia-intervention-6.9b-deduped", | |
"EleutherAI/pythia-intervention-1.4b-deduped", | |
"EleutherAI/pythia-intervention-70m-deduped", | |
"EleutherAI/pythia-intervention-long-1.4b-deduped", | |
"EleutherAI/pythia-70m-v0", | |
"EleutherAI/pythia-1.4b-v0", | |
"EleutherAI/pythia-6.9b-v0", | |
"EleutherAI/pythia-12b-deduped-v0", | |
"EleutherAI/pythia-12b-v0", | |
"EleutherAI/pythia-160m-seed3", | |
"EleutherAI/pythia-160m-seed2", | |
"EleutherAI/pythia-160m-seed1", | |
"EleutherAI/neox-ckpt-pythia-6.9b-deduped", | |
"EleutherAI/pythia-160m-hiddendropout", | |
"EleutherAI/pythia-160m-attndropout", | |
"EleutherAI/pythia-160m-alldropout", | |
"EleutherAI/pythia-6.9b-deduped-v0-seed42", | |
) | |
cerebras_models_list = ( | |
"cerebras/btlm-3b-8k-base", | |
"cerebras/cerebras-GPT-13B", | |
"cerebras/cerebras-GPT-6.7B", | |
"cerebras/cerebras-GPT-2.7B", | |
"cerebras/cerebras-GPT-1.3B", | |
"cerebras/cerebras-GPT-590M", | |
"cerebras/cerebras-GPT-256M", | |
"cerebras/cerebras-GPT-111M", | |
) | |
open_assistant_models_list = ( | |
"OpenAssistant/codellama-13b-oasst-sft-v10", | |
"OpenAssistant/llama2-70b-oasst-sft-v10", | |
"OpenAssistant/llama2-13b-megacode2-oasst", | |
"OpenAssistant/falcon-40b-megacode2-oasst", | |
"OpenAssistant/pythia-12b-sft-v8-rlhf-2k-steps", | |
"OpenAssistant/llama2-13b-orca-8k-3319", | |
"OpenAssistant/falcon-7b-sft-mix-2000", | |
"OpenAssistant/falcon-7b-sft-top1-696", | |
"OpenAssistant/falcon-40b-sft-mix-1226", | |
"OpenAssistant/falcon-40b-sft-top1-560", | |
"OpenAssistant/pythia-12b-sft-v8-2.5k-steps", | |
"OpenAssistant/pythia-12b-sft-v8-7k-steps", | |
"OpenAssistant/pythia-12b-pre-v8-12.5k-steps", | |
"OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5", | |
"OpenAssistant/stablelm-7b-sft-v7-epoch-3", | |
"OpenAssistant/oasst-sft-1-pythia-12b", | |
"OpenAssistant/galactica-6.7b-finetuned", | |
) | |
databricks_models_list = ( | |
"databricks/dolly-v2-7b", | |
"databricks/dolly-v2-3b", | |
"databricks/dolly-v2-12b", | |
"databricks/dolly-v1-6b", | |
) | |
nomic_ai_models_list = ( | |
"nomic-ai/gpt4all-falcon", | |
"nomic-ai/gpt4all-j", | |
"nomic-ai/gpt4all-mpt", | |
"nomic-ai/gpt4all-13b-snoozy", | |
"nomic-ai/gpt4all-j-lora", | |
) | |
blinkdl_models_list = ( | |
"BlinkDL/rwkv-5-world", | |
"BlinkDL/rwkv-4-world", | |
"BlinkDL/rwkv-4-raven", | |
"BlinkDL/rwkv-4-pile-7b", | |
"BlinkDL/rwkv-4-pile-14b", | |
"BlinkDL/rwkv-4-novel", | |
"BlinkDL/rwkv-4-pileplus", | |
"BlinkDL/rwkv-4-pile-430m", | |
"BlinkDL/rwkv-4-pile-3b", | |
"BlinkDL/rwkv-4-pile-1b5", | |
"BlinkDL/rwkv-4-pile-169m", | |
"BlinkDL/rwkv-3-pile-1b5", | |
"BlinkDL/rwkv-3-pile-430m", | |
"BlinkDL/rwkv-2-pile-430m", | |
"BlinkDL/rwkv-3-pile-169m", | |
) | |
ai_squared_models_list = ( | |
"aisquared/dlite-dais-2023", | |
"aisquared/chopt-1_3b", | |
"aisquared/chopt-350m", | |
"aisquared/chopt-125m", | |
"aisquared/chopt-2_7b", | |
"aisquared/dlite-v2-1_5b", | |
"aisquared/dlite-v2-774m", | |
"aisquared/dlite-v2-355m", | |
"aisquared/dlite-v2-124m", | |
"aisquared/dlite-v1-355m", | |
"aisquared/dlite-v1-774m", | |
"aisquared/dlite-v1-1_5b", | |
"aisquared/dlite-v1-124m", | |
"aisquared/chopt-research-350m", | |
"aisquared/chopt-research-125m", | |
"aisquared/chopt-research-2_7b", | |
"aisquared/chopt-research-1_3b", | |
) | |
bloom_models_list = ( | |
"bigscience/bloom-3b-intermediate", | |
"bigscience/bloom", | |
"bigscience/bloomz-p3", | |
"bigscience/bloomz-mt", | |
"bigscience/bloomz-7b1-mt", | |
"bigscience/bloom-1b7-intermediate", | |
"bigscience/bloom-560m-intermediate", | |
"bigscience/bloomz-560m", | |
"bigscience/bloomz-1b1", | |
"bigscience/bloomz-1b7", | |
"bigscience/bloomz-3b", | |
"bigscience/bloomz-7b1", | |
'bigscience/bloomz', | |
"bigscience/bloom-1b7", | |
"bigscience/bloom-560m", | |
"bigscience/bloom-3b", | |
"bigscience/bigscience-small-testing", | |
"bigscience/distill-bloom-1b3", | |
"bigscience/bloom-1b1", | |
"bigscience/distill-bloom-1b3-10x", | |
"bigscience/test-bloomd", | |
"bigscience/test-bloomd-6b3", | |
"bigscience/bloom-7b1", | |
"bigscience/bloom-petals", | |
"bigscience/bloom-1b1-intermediate", | |
"bigscience/bloom-7b1-intermediate", | |
"bigscience/bloom-7b1-petals", | |
"bigscience/bloomz-petals", | |
"bigscience/bloomz-7b1-p3", | |
) | |
tiiuae_models_list = ( | |
"tiiuae/falcon-180B", | |
"tiiuae/falcon-180B-chat", | |
"tiiuae/falcon-40b", | |
"tiiuae/falcon-7b", | |
"tiiuae/falcon-7b-instruct", | |
"tiiuae/falcon-40b-instruct", | |
"tiiuae/falcon-rw-7b", | |
"tiiuae/falcon-rw-1b", | |
) | |
openlm_models_list = ( | |
"openlm-research/open_llama_3b_v2", | |
"openlm-research/open_llama_7b_v2", | |
"openlm-research/open_llama_13b", | |
"openlm-research/open_llama_7b", | |
"openlm-research/open_llama_3b", | |
) | |
stabilityai_models_list = ( | |
"stabilityai/StableBeluga-7B", | |
"stabilityai/StableBeluga-13B", | |
"stabilityai/StableBeluga2", | |
"stabilityai/stablelm-base-alpha-3b-v2", | |
"stabilityai/stablelm-base-alpha-7b-v2", | |
"stabilityai/japanese-stablelm-instruct-alpha-7b", | |
"stabilityai/japanese-stablelm-base-alpha-7b", | |
"stabilityai/stablecode-completion-alpha-3b-4k", | |
"stabilityai/stablecode-instruct-alpha-3b", | |
"stabilityai/stablecode-completion-alpha-3b", | |
"stabilityai/StableBeluga1-Delta", | |
"stabilityai/stablelm-base-alpha-3b", | |
"stabilityai/stablelm-base-alpha-7b", | |
"stabilityai/stablelm-tuned-alpha-3b", | |
"stabilityai/stablelm-tuned-alpha-7b", | |
) | |
lmsys_models_list = ( | |
"lmsys/vicuna-13b-v1.5-16k", | |
"lmsys/vicuna-13b-v1.5", | |
"lmsys/vicuna-7b-v1.5-16k", | |
"lmsys/longchat-7b-v1.5-32k", | |
"lmsys/vicuna-7b-v1.5", | |
"lmsys/vicuna-7b-v1.3", | |
"lmsys/vicuna-13b-v1.3", | |
"lmsys/vicuna-7b-v1.1", | |
"lmsys/vicuna-13b-v1.1", | |
"lmsys/vicuna-13b-delta-v0", | |
"lmsys/vicuna-7b-delta-v0", | |
"lmsys/vicuna-13b-delta-v1.1", | |
"lmsys/vicuna-7b-delta-v1.1", | |
"lmsys/vicuna-33b-v1.3", | |
"lmsys/longchat-13b-16k", | |
'lmsys/longchat-7b-16k', | |
) | |
togethercomputer_models_list = ( | |
'togethercomputer/Llama-2-7B-32K-Instruct', | |
'togethercomputer/RedPajama-INCITE-7B-Instruct', | |
'togethercomputer/LLaMA-2-7B-32K', | |
'togethercomputer/RedPajama-INCITE-7B-Base', | |
'togethercomputer/RedPajama-INCITE-7B-Chat', | |
'togethercomputer/RedPajama-INCITE-Chat-3B-v1', | |
'togethercomputer/RedPajama-INCITE-Instruct-3B-v1', | |
'togethercomputer/RedPajama-INCITE-Base-3B-v1', | |
'togethercomputer/GPT-NeoXT-Chat-Base-20B', | |
'togethercomputer/Pythia-Chat-Base-7B', | |
'togethercomputer/GPT-JT-Moderation-6B', | |
'togethercomputer/GPT-JT-6B-v1', | |
'togethercomputer/GPT-JT-6B-v0' | |
) | |
mosaic_models_list = ( | |
'mosaicml/mpt-7b-chat', | |
'mosaicml/mpt-30b-chat', | |
'mosaicml/mpt-7b-8k-chat', | |
'mosaicml/mpt-7b-instruct', | |
'mosaicml/mpt-7b-8k-instruct', | |
'mosaicml/mpt-7b-8k', | |
'mosaicml/mpt-30b', | |
'mosaicml/mpt-7b', | |
'mosaicml/mpt-7b-storywriter', | |
'mosaicml/mpt-30b-instruct', | |
'mosaicml/mpt-1b-redpajama-200b', | |
'mosaicml/mpt-1b-redpajama-200b-dolly' | |
) | |
h20ai_models_list = ( | |
'h2oai/h2ogpt-16k-codellama-7b-python', | |
'h2oai/h2ogpt-16k-codellama-7b-instruct', | |
'h2oai/h2ogpt-16k-codellama-7b', | |
'h2oai/h2ogpt-16k-codellama-34b-python', | |
'h2oai/h2ogpt-16k-codellama-34b-instruct', | |
'h2oai/h2ogpt-16k-codellama-13b-python', | |
'h2oai/h2ogpt-16k-codellama-13b-instruct', | |
'h2oai/h2ogpt-16k-codellama-13b', | |
'h2oai/h2ogpt-16k-codellama-34b', | |
'h2oai/h2ogpt-4096-llama2-13b-chat', | |
'h2oai/h2ogpt-4096-llama2-70b-chat', | |
'h2oai/h2ogpt-4096-llama2-7b-chat', | |
'h2oai/h2ogpt-4096-llama2-13b', | |
'h2oai/h2ogpt-4096-llama2-7b', | |
'h2oai/h2ogpt-4096-llama2-70b', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-falcon-40b-v2', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-falcon-7b-v3', | |
'h2oai/h2ogpt-research-oasst1-llama-65b', | |
'h2oai/h2ogpt-gm-oasst1-en-xgen-7b-8k', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-3b', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b', | |
'h2oai/h2ogpt-oasst1-falcon-40b', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-falcon-40b-v1', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-13b', | |
'h2oai/h2ogpt-oig-oasst1-falcon-40b', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-falcon-7b', | |
'h2oai/h2ogpt-gm-oasst1-multilang-2048-falcon-7b', | |
'h2oai/h2ogpt-oasst1-512-12b', | |
'h2oai/h2ogpt-oig-oasst1-256-6_9b', | |
'h2oai/h2ogpt-oig-oasst1-512-6_9b', | |
'h2oai/h2ogpt-research-oig-oasst1-512-30b', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-700bt', | |
'h2oai/h2ogpt-gm-oasst1-en-1024-open-llama-7b-preview-400bt', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2', | |
'h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt', | |
'h2oai/h2ogpt-gm-oasst1-en-1024-12b', | |
'h2oai/h2ogpt-gm-oasst1-en-1024-20b', | |
'h2oai/h2ogpt-gm-oasst1-multilang-1024-20b', | |
'h2oai/h2ogpt-oasst1-512-20b' | |
) | |
facebook_models_list = ( | |
'facebook/xglm-4.5B', | |
'facebook/galactica-125m', | |
'facebook/opt-iml-1.3b', | |
'facebook/opt-iml-max-1.3b', | |
'facebook/opt-iml-max-30b', | |
'facebook/opt-iml-30b', | |
'facebook/galactica-120b', | |
'facebook/galactica-30b', | |
'facebook/galactica-6.7b', | |
'facebook/galactica-1.3b', | |
'facebook/opt-66b', | |
'facebook/opt-30b', | |
'facebook/opt-13b', | |
'facebook/opt-6.7b', | |
'facebook/opt-2.7b', | |
'facebook/opt-1.3b', | |
'facebook/opt-350m', | |
'facebook/opt-125m', | |
'facebook/incoder-1B', | |
'facebook/incoder-6B', | |
'facebook/xglm-7.5B', | |
'facebook/xglm-564M', | |
'facebook/xglm-2.9B', | |
'facebook/xglm-1.7B' | |
) | |
microsoft_models_list = ( | |
"microsoft/dolly-v2-7b-olive-optimized", | |
"microsoft/lts-gpt2-sm", | |
"microsoft/BioGPT-Large", | |
"microsoft/BioGPT-Large-PubMedQA", | |
"microsoft/biogpt", | |
"microsoft/git-large-vatex", | |
"microsoft/git-base-msrvtt-qa", | |
"microsoft/git-base-vatex", | |
"microsoft/Promptist", | |
"microsoft/CodeGPT-small-py", | |
"microsoft/CodeGPT-small-py-adaptedGPT2", | |
"microsoft/CodeGPT-small-java", | |
"microsoft/CodeGPT-small-java-adaptedGPT2", | |
"microsoft/phi-1", | |
"microsoft/phi-1_5", | |
) | |
langboat_models_list = ( | |
"Langboat/bloom-1b4-zh", | |
"Langboat/ReGPT-125M-200G", | |
"Langboat/bloom-6b4-zh", | |
"Langboat/bloom-2b5-zh", | |
"Langboat/bloom-800m-zh", | |
"Langboat/bloom-389m-zh", | |
"Langboat/mengzi-gpt-neo-base", | |
) | |
allenai_models_list = ( | |
'allenai/bhaskara', | |
'allenai/open-instruct-pythia-6.9b-tulu', | |
'allenai/open-instruct-opt-6.7b-tulu', | |
'allenai/open-instruct-sni-13b', | |
'allenai/open-instruct-flan-v2-13b', | |
'allenai/open-instruct-dolly-13b', | |
'allenai/open-instruct-self-instruct-13b', | |
'allenai/open-instruct-self-instruct-7b', | |
'allenai/open-instruct-oasst1-13b', | |
'allenai/open-instruct-oasst1-7b', | |
'allenai/open-instruct-sni-7b', | |
'allenai/open-instruct-baize-13b', | |
'allenai/open-instruct-baize-7b', | |
'allenai/open-instruct-cot-13b', | |
'allenai/open-instruct-cot-7b', | |
'allenai/open-instruct-gpt4-alpaca-13b', | |
'allenai/open-instruct-gpt4-alpaca-7b', | |
'allenai/open-instruct-human-mix-7b', | |
'allenai/open-instruct-human-mix-13b', | |
'allenai/open-instruct-sharegpt-7b', | |
'allenai/open-instruct-sharegpt-13b', | |
'allenai/open-instruct-sharegpt-30b', | |
'allenai/open-instruct-human-mix-30b', | |
'allenai/tulu-7b', | |
'allenai/tulu-13b', | |
'allenai/tulu-30b', | |
'allenai/open-instruct-code-alpaca-13b', | |
'allenai/open-instruct-code-alpaca-7b', | |
'allenai/open-instruct-unnatural-instructions-13b', | |
'allenai/open-instruct-unnatural-instructions-7b', | |
'allenai/open-instruct-stanford-alpaca-13b', | |
'allenai/open-instruct-stanford-alpaca-7b', | |
'allenai/open-instruct-flan-v2-7b', | |
'allenai/open-instruct-dolly-7b', | |
'allenai/tulu-65b', | |
'allenai/open-instruct-sharegpt-65b', | |
'allenai/open-instruct-human-mix-65b' | |
) | |
deciai_models_list = ( | |
"Deci/DeciLM-6b", | |
"Deci/DeciLM-6b-instruct", | |
"Deci/DeciCoder-1b", | |
) | |
salesforce_models_list = ( | |
'Salesforce/codegen25-7b-multi', | |
'Salesforce/xgen-7b-4k-base', | |
'Salesforce/xgen-7b-8k-inst', | |
'Salesforce/xgen-7b-8k-base', | |
'Salesforce/codegen25-7b-mono', | |
'Salesforce/codegen25-7b-instruct', | |
'Salesforce/ctrl', | |
'Salesforce/codegen2-16B', | |
'Salesforce/codegen2-7B', | |
'Salesforce/codegen2-3_7B', | |
'Salesforce/codegen2-1B', | |
'Salesforce/codegen-350M-mono', | |
'Salesforce/codegen-350M-multi', | |
'Salesforce/codegen-16B-nl', | |
'Salesforce/codegen-2B-mono', | |
'Salesforce/codegen-16B-multi', | |
'Salesforce/codegen-2B-multi', | |
'Salesforce/codegen-6B-nl', | |
'Salesforce/codegen-2B-nl', | |
'Salesforce/codegen-350M-nl', | |
'Salesforce/codegen-6B-multi', | |
'Salesforce/codegen-6B-mono', | |
'Salesforce/codegen-16B-mono' | |
) | |
model_dict = { | |
"google": google_models_list, | |
"mbzuai": mbzuai_models_list, | |
"eleutherai": eleutherai_models_list, | |
"cerebras": cerebras_models_list, | |
"open_assistant": open_assistant_models_list, | |
"databricks": databricks_models_list, | |
"nomic_ai": nomic_ai_models_list, | |
"blinkdl": blinkdl_models_list, | |
"aisquared": ai_squared_models_list, | |
"bloom": bloom_models_list, | |
"tiiuae": tiiuae_models_list, | |
"openlm": openlm_models_list, | |
"stabilityai": stabilityai_models_list, | |
"lmsys": lmsys_models_list, | |
"together_computer": togethercomputer_models_list, | |
"mosaic_ml": mosaic_models_list, | |
"h20ai": h20ai_models_list, | |
"facebook": facebook_models_list, | |
"microsoft": microsoft_models_list, | |
"langboat": langboat_models_list, | |
"allenai": allenai_models_list, | |
"deciai": deciai_models_list, | |
"salesforce": salesforce_models_list | |
} | |
if count is True: | |
models_count = 0 | |
for i in model_dict: | |
models_count += len(model_dict[i]) | |
return models_count | |
return model_dict[model_parent] | |