"""Additional information of the models.

This module keeps a registry that maps a model's full name (for example
``"vicuna-13b-v1.3"``) to a :class:`ModelInfo` record holding a short display
name, a reference link and a one-line description.  The built-in models are
registered at import time by the calls at the bottom of the file.
"""
from collections import namedtuple
from typing import Dict, List


# Display metadata for one model family: (simple_name, link, description).
ModelInfo = namedtuple("ModelInfo", ["simple_name", "link", "description"])


# Registry: full model name -> ModelInfo.  Several full names may point to the
# very same ModelInfo object when they were registered together.
model_info: Dict[str, ModelInfo] = {}


def register_model_info(
    full_names: List[str], simple_name: str, link: str, description: str
) -> None:
    """Register display metadata for one or more model names.

    A single ``ModelInfo`` is built from ``simple_name``, ``link`` and
    ``description`` and stored under every entry of ``full_names``.
    Registering a name that already exists replaces the previous entry.

    Args:
        full_names: Full model names that should share this metadata.
        simple_name: Short, human-readable name of the model.
        link: URL with more information about the model.
        description: One-line description of the model.
    """
    info = ModelInfo(simple_name, link, description)
    for full_name in full_names:
        model_info[full_name] = info


def get_model_info(name: str) -> ModelInfo:
    """Return the metadata registered for ``name``.

    Args:
        name: Full model name, exactly as passed to ``register_model_info``
            (the lookup is case-sensitive).

    Returns:
        The ``ModelInfo`` registered under ``name``.

    Raises:
        KeyError: If ``name`` has not been registered.
    """
    try:
        return model_info[name]
    except KeyError:
        # Same exception type as a plain dict lookup, but with a message that
        # tells the caller how to resolve the problem.
        raise KeyError(
            f"Model {name!r} is not registered; "
            "use register_model_info() to register it."
        ) from None


register_model_info(
    ["gpt-4"], "ChatGPT-4", "https://openai.com/research/gpt-4", "ChatGPT-4 by OpenAI"
)
register_model_info(
    ["gpt-3.5-turbo"],
    "ChatGPT-3.5",
    "https://openai.com/blog/chatgpt",
    "ChatGPT-3.5 by OpenAI",
)
register_model_info(
    ["gpt-3.5-turbo-16k"],
    "ChatGPT-3.5-16k",
    "https://openai.com/blog/chatgpt",
    "ChatGPT-3.5 with 16k by OpenAI",
)
register_model_info(
    ["claude-v1"],
    "Claude",
    "https://www.anthropic.com/index/introducing-claude",
    "Claude by Anthropic",
)
register_model_info(
    ["claude-instant-v1"],
    "Claude Instant",
    "https://www.anthropic.com/index/introducing-claude",
    "Claude Instant by Anthropic",
)
register_model_info(
    ["palm-2"],
    "PaLM 2 Chat",
    "https://cloud.google.com/vertex-ai/docs/release-notes#May_10_2023",
    "PaLM 2 for Chat (chat-bison@001) by Google",
)
register_model_info(
    [
        "vicuna-13b",
        "vicuna-13b-v1.3",
        "vicuna-7b",
        "vicuna-7b-v1.3",
        "vicuna-33b",
        "vicuna-33b-v1.3",
    ],
    "Vicuna",
    "https://lmsys.org/blog/2023-03-30-vicuna/",
    "a chat assistant fine-tuned from LLaMA on user-shared conversations by LMSYS",
)
register_model_info(
    ["wizardlm-13b"],
    "WizardLM",
    "https://github.com/nlpxucan/WizardLM",
    "an instruction-following LLM using evol-instruct by Microsoft",
)
register_model_info(
    ["guanaco-33b", "guanaco-65b"],
    "Guanaco",
    "https://github.com/artidoro/qlora",
    "a model fine-tuned with QLoRA by UW",
)
register_model_info(
    ["mpt-7b-chat"],
    "MPT-Chat",
    "https://www.mosaicml.com/blog/mpt-7b",
    "a chatbot fine-tuned from MPT-7B by MosaicML",
)
register_model_info(
    ["mpt-30b-chat"],
    "MPT-Chat",
    "https://www.mosaicml.com/blog/mpt-30b",
    "a chatbot fine-tuned from MPT-30B by MosaicML",
)
register_model_info(
    ["gpt4all-13b-snoozy"],
    "GPT4All-Snoozy",
    "https://github.com/nomic-ai/gpt4all",
    "A finetuned LLaMA model on assistant style data by Nomic AI",
)
register_model_info(
    ["koala-13b"],
    "Koala",
    "https://bair.berkeley.edu/blog/2023/04/03/koala",
    "a dialogue model for academic research by BAIR",
)
register_model_info(
    ["RWKV-4-Raven-14B"],
    "RWKV-4-Raven",
    "https://huggingface.co/BlinkDL/rwkv-4-raven",
    "an RNN with transformer-level LLM performance",
)
register_model_info(
    ["alpaca-13b"],
    "Alpaca",
    "https://crfm.stanford.edu/2023/03/13/alpaca.html",
    "a model fine-tuned from LLaMA on instruction-following demonstrations by Stanford",
)
register_model_info(
    ["chatglm-6b", "chatglm2-6b"],
    "ChatGLM",
    "https://chatglm.cn/blog",
    "an open bilingual dialogue language model by Tsinghua University",
)
register_model_info(
    ["oasst-pythia-12b"],
    "OpenAssistant (oasst)",
    "https://open-assistant.io",
    "an Open Assistant for everyone by LAION",
)
register_model_info(
    ["oasst-sft-7-llama-30b"],
    "OpenAssistant (oasst)",
    "https://open-assistant.io",
    "an Open Assistant for everyone by LAION",
)
register_model_info(
    ["llama-13b"],
    "LLaMA",
    "https://arxiv.org/abs/2302.13971",
    "open and efficient foundation language models by Meta",
)
register_model_info(
    ["dolly-v2-12b"],
    "Dolly",
    "https://www.databricks.com/blog/2023/04/12/dolly-first-open-commercially-viable-instruction-tuned-llm",
    "an instruction-tuned open large language model by Databricks",
)
register_model_info(
    ["stablelm-tuned-alpha-7b"],
    "StableLM",
    "https://github.com/stability-AI/stableLM",
    "Stability AI language models",
)
register_model_info(
    ["codet5p-6b"],
    "CodeT5p-6b",
    "https://huggingface.co/Salesforce/codet5p-6b",
    "Code completion model released by Salesforce",
)
register_model_info(
    ["fastchat-t5-3b", "fastchat-t5-3b-v1.0"],
    "FastChat-T5",
    "https://huggingface.co/lmsys/fastchat-t5-3b-v1.0",
    "a chat assistant fine-tuned from FLAN-T5 by LMSYS",
)
register_model_info(
    ["phoenix-inst-chat-7b"],
    "Phoenix-7B",
    "https://huggingface.co/FreedomIntelligence/phoenix-inst-chat-7b",
    "a multilingual chat assistant fine-tuned from Bloomz to democratize ChatGPT across languages by CUHK(SZ)",
)
register_model_info(
    ["billa-7b-sft"],
    "BiLLa-7B-SFT",
    "https://huggingface.co/Neutralzz/BiLLa-7B-SFT",
    "an instruction-tuned bilingual LLaMA with enhanced reasoning ability by an independent researcher",
)
register_model_info(
    ["h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2"],
    "h2oGPT-GM-7b",
    "https://huggingface.co/h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2",
    "an instruction-tuned OpenLLaMA with enhanced conversational ability by H2O.ai",
)
register_model_info(
    ["baize-v2-7b", "baize-v2-13b"],
    "Baize v2",
    "https://github.com/project-baize/baize-chatbot#v2",
    # Spelling corrected from "Self-Disillation".
    "A chatbot fine-tuned from LLaMA with ChatGPT self-chat data and Self-Distillation with Feedback (SDF) by UCSD and SYSU.",
)
register_model_info(
    ["Robin-7b-v2", "Robin-13b-v2", "Robin-33b-v2"],
    "Robin-v2",
    "https://huggingface.co/OptimalScale/robin-7b-v2-delta",
    "A chatbot fine-tuned from LLaMA-7b, achieving competitive performance on chitchat, commonsense reasoning and instruction-following tasks, by OptimalScale, HKUST.",
)
register_model_info(
    ["manticore-13b-chat"],
    "Manticore 13B Chat",
    "https://huggingface.co/openaccess-ai-collective/manticore-13b-chat-pyg",
    "A chatbot fine-tuned from LlaMa across several CoT and chat datasets.",
)
register_model_info(
    ["redpajama-incite-7b-chat"],
    "RedPajama-INCITE-7B-Chat",
    "https://huggingface.co/togethercomputer/RedPajama-INCITE-7B-Chat",
    "A chatbot fine-tuned from RedPajama-INCITE-7B-Base by Together",
)
register_model_info(
    ["falcon-7b", "falcon-7b-instruct", "falcon-40b", "falcon-40b-instruct"],
    "Falcon",
    "https://huggingface.co/tiiuae/falcon-40b",
    "TII's flagship series of large language models",
)
register_model_info(
    ["tigerbot-7b-sft"],
    "Tigerbot",
    "https://huggingface.co/TigerResearch/tigerbot-7b-sft",
    "TigerBot is a large-scale language model (LLM) with multiple languages and tasks.",
)