Spaces:

TIGER-Lab
/

GenAI-Arena

Running on Zero

App Files Files Community

GenAI-Arena / arena_elo /elo_rating /model_registry.py

tianleliphoebe

Reinitialize

e368cec 7 months ago

raw

history blame

16.4 kB

	"""Additional information of the models."""
	from collections import namedtuple, OrderedDict
	from typing import List


	ModelInfo = namedtuple("ModelInfo", ["simple_name", "link", "description"])


	model_info = OrderedDict()


	def register_model_info(
	full_names: List[str], simple_name: str, link: str, description: str
	):
	info = ModelInfo(simple_name, link, description)

	for full_name in full_names:
	model_info[full_name] = info


	def get_model_info(name: str) -> ModelInfo:
	if name in model_info:
	return model_info[name]
	else:
	# To fix this, please use `register_model_info` to register your model
	return ModelInfo(
	name, "", "Register the description at arena.model/model_registry.py"
	)


	register_model_info(
	[
	"IEITYuan/Yuan2-2B-Janus-hf",
	"IEITYuan/Yuan2-2B-hf",
	"IEITYuan/Yuan2-51B-hf",
	"IEITYuan/Yuan2-102B-hf",
	],
	"IEIT-Yuan2",
	"https://github.com/IEIT-Yuan/Yuan-2.0",
	"Yuan2.0 is a new generation Fundamental Large Language Model developed by IEIT System.",
	)

	register_model_info(
	["mixtral-8x7b-instruct-v0.1", "mistral-7b-instruct"],
	"Mixtral of experts",
	"https://mistral.ai/news/mixtral-of-experts/",
	"A Mixture-of-Experts model by Mistral AI",
	)

	register_model_info(
	["gemini-pro"],
	"Gemini",
	"https://blog.google/technology/ai/google-gemini-pro-imagen-duet-ai-update/",
	"Gemini by Google",
	)

	register_model_info(
	["gemini-pro-vision"],
	"Gemini",
	"https://blog.google/technology/ai/google-gemini-pro-imagen-duet-ai-update/",
	"Gemini by Google",
	)

	register_model_info(
	["solar-10.7b-instruct-v1.0"],
	"SOLAR-10.7B-Instruct",
	"https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0",
	"A model trained using depth up-scaling by Upstage AI",
	)

	register_model_info(
	["gpt-4-turbo"],
	"GPT-4-Turbo",
	"https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo",
	"GPT-4-Turbo by OpenAI",
	)

	register_model_info(
	["gpt-4-vision-preview"],
	"gpt-4-vision-preview",
	"https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo",
	"GPT-4(V) by OpenAI",
	)

	register_model_info(
	["gpt-3.5-turbo", "gpt-3.5-turbo-0314", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-1106"],
	"GPT-3.5",
	"https://platform.openai.com/docs/models/gpt-3-5",
	"GPT-3.5-Turbo by OpenAI",
	)

	register_model_info(
	["gpt-4", "gpt-4-0314", "gpt-4-0613"],
	"GPT-4",
	"https://openai.com/research/gpt-4",
	"GPT-4 by OpenAI",
	)

	register_model_info(
	["claude-2.1", "claude-2.0"],
	"Claude",
	"https://www.anthropic.com/index/claude-2",
	"Claude 2 by Anthropic",
	)

	register_model_info(
	["claude-1"],
	"Claude",
	"https://www.anthropic.com/index/introducing-claude",
	"Claude 1 by Anthropic",
	)

	register_model_info(
	["claude-instant-1", "claude-instant-1.2"],
	"Claude Instant",
	"https://www.anthropic.com/index/introducing-claude",
	"Claude Instant by Anthropic",
	)

	register_model_info(
	["pplx-70b-online", "pplx-7b-online"],
	"pplx-online-llms",
	"https://blog.perplexity.ai/blog/introducing-pplx-online-llms",
	"Online LLM API by Perplexity AI",
	)

	register_model_info(
	["openhermes-2.5-mistral-7b"],
	"OpenHermes-2.5-Mistral-7B",
	"https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B",
	"a mistral-based model fine-tuned on 1M GPT-4 outputs",
	)

	register_model_info(
	["starling-lm-7b-alpha"],
	"Starling-LM-7B-alpha",
	"https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha",
	"an open model trained using RLAIF by Berkeley",
	)

	register_model_info(
	["tulu-2-dpo-70b"],
	"Tulu 2",
	"https://huggingface.co/allenai/tulu-2-dpo-70b",
	"an instruction and RLHF model by UW/AllenAI",
	)

	register_model_info(
	["yi-34b-chat", "yi-6b-chat"],
	"Yi-Chat",
	"https://huggingface.co/01-ai/Yi-34B-Chat",
	"A large language model by 01 AI",
	)

	register_model_info(
	["llama-2-70b-chat", "llama-2-34b-chat", "llama-2-13b-chat", "llama-2-7b-chat"],
	"Llama 2",
	"https://ai.meta.com/llama/",
	"open foundation and fine-tuned chat models by Meta",
	)

	register_model_info(
	[
	"vicuna-33b",
	"vicuna-33b-v1.3",
	"vicuna-13b",
	"vicuna-13b-v1.3",
	"vicuna-7b",
	"vicuna-7b-v1.3",
	],
	"Vicuna",
	"https://lmsys.org/blog/2023-03-30-vicuna/",
	"a chat assistant fine-tuned on user-shared conversations by LMSYS",
	)

	register_model_info(
	["chatglm3-6b", "chatglm2-6b", "chatglm-6b"],
	"ChatGLM",
	"https://chatglm.cn/blog",
	"an open bilingual dialogue language model by Tsinghua University",
	)

	register_model_info(
	["openchat-3.5"],
	"OpenChat 3.5",
	"https://github.com/imoneoi/openchat",
	"an open model fine-tuned on Mistral-7B using C-RLFT",
	)

	register_model_info(
	["tenyxchat-7b-v1"],
	"TenyxChat-7B",
	"https://huggingface.co/tenyx/TenyxChat-7B-v1",
	"an open model DPO trained on top of OpenChat-3.5 using Tenyx fine-tuning",
	)

	register_model_info(
	["zephyr-7b-beta", "zephyr-7b-alpha"],
	"Zephyr",
	"https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha",
	"a chatbot fine-tuned from Mistral by Hugging Face",
	)

	register_model_info(
	["notus-7b-v1"],
	"Notus",
	"https://huggingface.co/argilla/notus-7b-v1",
	"a chatbot fine-tuned from Zephyr SFT by Argilla",
	)

	register_model_info(
	["catppt"],
	"CatPPT",
	"https://huggingface.co/rishiraj/CatPPT",
	"a chatbot fine-tuned from a SLERP merged model by Rishiraj Acharya",
	)

	register_model_info(
	["TinyLlama"],
	"TinyLlama",
	"https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0",
	"The TinyLlama project is an open endeavor to pretrain a 1.1B Llama model on 3 trillion tokens.",
	)

	register_model_info(
	["qwen-14b-chat"],
	"Qwen",
	"https://huggingface.co/Qwen/Qwen-14B-Chat",
	"a large language model by Alibaba Cloud",
	)

	register_model_info(
	["codellama-34b-instruct", "codellama-13b-instruct", "codellama-7b-instruct"],
	"Code Llama",
	"https://ai.meta.com/blog/code-llama-large-language-model-coding/",
	"open foundation models for code by Meta",
	)

	register_model_info(
	["wizardlm-70b", "wizardlm-30b", "wizardlm-13b"],
	"WizardLM",
	"https://github.com/nlpxucan/WizardLM",
	"an instruction-following LLM using evol-instruct by Microsoft",
	)

	register_model_info(
	["wizardcoder-15b-v1.0"],
	"WizardLM",
	"https://github.com/nlpxucan/WizardLM/tree/main/WizardCoder",
	"Empowering Code Large Language Models with Evol-Instruct",
	)

	register_model_info(
	["mpt-7b-chat", "mpt-30b-chat"],
	"MPT-Chat",
	"https://www.mosaicml.com/blog/mpt-30b",
	"a chatbot fine-tuned from MPT by MosaicML",
	)

	register_model_info(
	["guanaco-33b", "guanaco-65b"],
	"Guanaco",
	"https://github.com/artidoro/qlora",
	"a model fine-tuned with QLoRA by UW",
	)

	register_model_info(
	["gpt4all-13b-snoozy"],
	"GPT4All-Snoozy",
	"https://github.com/nomic-ai/gpt4all",
	"a finetuned LLaMA model on assistant style data by Nomic AI",
	)

	register_model_info(
	["koala-13b"],
	"Koala",
	"https://bair.berkeley.edu/blog/2023/04/03/koala",
	"a dialogue model for academic research by BAIR",
	)

	register_model_info(
	["RWKV-4-Raven-14B"],
	"RWKV-4-Raven",
	"https://huggingface.co/BlinkDL/rwkv-4-raven",
	"an RNN with transformer-level LLM performance",
	)

	register_model_info(
	["alpaca-13b"],
	"Alpaca",
	"https://crfm.stanford.edu/2023/03/13/alpaca.html",
	"a model fine-tuned from LLaMA on instruction-following demonstrations by Stanford",
	)

	register_model_info(
	["oasst-pythia-12b"],
	"OpenAssistant (oasst)",
	"https://open-assistant.io",
	"an Open Assistant for everyone by LAION",
	)

	register_model_info(
	["oasst-sft-7-llama-30b"],
	"OpenAssistant (oasst)",
	"https://open-assistant.io",
	"an Open Assistant for everyone by LAION",
	)

	register_model_info(
	["palm-2"],
	"PaLM 2 Chat",
	"https://cloud.google.com/vertex-ai/docs/release-notes#May_10_2023",
	"PaLM 2 for Chat (chat-bison@001) by Google",
	)

	register_model_info(
	["llama-7b", "llama-13b"],
	"LLaMA",
	"https://arxiv.org/abs/2302.13971",
	"open and efficient foundation language models by Meta",
	)

	register_model_info(
	["open-llama-7b-v2-open-instruct", "open-llama-7b-open-instruct"],
	"Open LLaMa (Open Instruct)",
	"https://medium.com/vmware-data-ml-blog/starter-llm-for-the-enterprise-instruction-tuning-openllama-7b-d05fc3bbaccc",
	"Open LLaMa fine-tuned on instruction-following data by VMware",
	)

	register_model_info(
	["dolly-v2-12b"],
	"Dolly",
	"https://www.databricks.com/blog/2023/04/12/dolly-first-open-commercially-viable-instruction-tuned-llm",
	"an instruction-tuned open large language model by Databricks",
	)

	register_model_info(
	["stablelm-tuned-alpha-7b"],
	"StableLM",
	"https://github.com/stability-AI/stableLM",
	"Stability AI language models",
	)

	register_model_info(
	["codet5p-6b"],
	"CodeT5p-6b",
	"https://huggingface.co/Salesforce/codet5p-6b",
	"Code completion model released by Salesforce",
	)

	register_model_info(
	["fastchat-t5-3b", "fastchat-t5-3b-v1.0"],
	"FastChat-T5",
	"https://huggingface.co/lmsys/fastchat-t5-3b-v1.0",
	"a chat assistant fine-tuned from FLAN-T5 by LMSYS",
	)

	register_model_info(
	["phoenix-inst-chat-7b"],
	"Phoenix-7B",
	"https://huggingface.co/FreedomIntelligence/phoenix-inst-chat-7b",
	"a multilingual chat assistant fine-tuned from Bloomz to democratize ChatGPT across languages by CUHK(SZ)",
	)

	register_model_info(
	["realm-7b-v1"],
	"ReaLM",
	"https://github.com/FreedomIntelligence/ReaLM",
	"A chatbot fine-tuned from LLaMA2 with data generated via iterative calls to UserGPT and ChatGPT by CUHK(SZ) and SRIBD.",
	)

	register_model_info(
	["billa-7b-sft"],
	"BiLLa-7B-SFT",
	"https://huggingface.co/Neutralzz/BiLLa-7B-SFT",
	"an instruction-tuned bilingual LLaMA with enhanced reasoning ability by an independent researcher",
	)

	register_model_info(
	["h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2"],
	"h2oGPT-GM-7b",
	"https://huggingface.co/h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2",
	"an instruction-tuned OpenLLaMA with enhanced conversational ability by H2O.ai",
	)

	register_model_info(
	["baize-v2-7b", "baize-v2-13b"],
	"Baize v2",
	"https://github.com/project-baize/baize-chatbot#v2",
	"A chatbot fine-tuned from LLaMA with ChatGPT self-chat data and Self-Disillation with Feedback (SDF) by UCSD and SYSU.",
	)

	register_model_info(
	[
	"airoboros-l2-7b-2.1",
	"airoboros-l2-13b-2.1",
	"airoboros-c34b-2.1",
	"airoboros-l2-70b-2.1",
	],
	"airoboros",
	"https://huggingface.co/jondurbin/airoboros-l2-70b-2.1",
	"an instruction-tuned LlaMa model tuned with 100% synthetic instruction-response pairs from GPT4",
	)

	register_model_info(
	[
	"spicyboros-7b-2.2",
	"spicyboros-13b-2.2",
	"spicyboros-70b-2.2",
	],
	"spicyboros",
	"https://huggingface.co/jondurbin/spicyboros-70b-2.2",
	"de-aligned versions of the airoboros models",
	)

	register_model_info(
	["Robin-7b-v2", "Robin-13b-v2", "Robin-33b-v2"],
	"Robin-v2",
	"https://huggingface.co/OptimalScale/robin-7b-v2-delta",
	"A chatbot fine-tuned from LLaMA-7b, achieving competitive performance on chitchat, commonsense reasoning and instruction-following tasks, by OptimalScale, HKUST.",
	)

	register_model_info(
	["manticore-13b-chat"],
	"Manticore 13B Chat",
	"https://huggingface.co/openaccess-ai-collective/manticore-13b-chat-pyg",
	"A chatbot fine-tuned from LlaMa across several CoT and chat datasets.",
	)

	register_model_info(
	["redpajama-incite-7b-chat"],
	"RedPajama-INCITE-7B-Chat",
	"https://huggingface.co/togethercomputer/RedPajama-INCITE-7B-Chat",
	"A chatbot fine-tuned from RedPajama-INCITE-7B-Base by Together",
	)

	register_model_info(
	[
	"falcon-7b",
	"falcon-7b-instruct",
	"falcon-40b",
	"falcon-40b-instruct",
	"falcon-180b",
	"falcon-180b-chat",
	],
	"Falcon",
	"https://huggingface.co/tiiuae/falcon-180B",
	"TII's flagship series of large language models",
	)

	register_model_info(
	["tigerbot-7b-sft"],
	"Tigerbot",
	"https://huggingface.co/TigerResearch/tigerbot-7b-sft",
	"TigerBot is a large-scale language model (LLM) with multiple languages and tasks.",
	)

	register_model_info(
	["internlm-chat-7b", "internlm-chat-7b-8k"],
	"InternLM",
	"https://huggingface.co/internlm/internlm-chat-7b",
	"InternLM is a multi-language large-scale language model (LLM), developed by SHLAB.",
	)

	register_model_info(
	["Qwen-7B-Chat"],
	"Qwen",
	"https://huggingface.co/Qwen/Qwen-7B-Chat",
	"Qwen is a multi-language large-scale language model (LLM), developed by Damo Academy.",
	)

	register_model_info(
	["Llama2-Chinese-13b-Chat", "LLama2-Chinese-13B"],
	"Llama2-Chinese",
	"https://huggingface.co/FlagAlpha/Llama2-Chinese-13b-Chat",
	"Llama2-Chinese is a multi-language large-scale language model (LLM), developed by FlagAlpha.",
	)

	register_model_info(
	["Chinese-Alpaca-2-7B", "Chinese-Alpaca-2-13B"],
	"Chinese-Alpaca",
	"https://huggingface.co/hfl/chinese-alpaca-2-13b",
	"New extended Chinese vocabulary beyond Llama-2, open-sourcing the Chinese LLaMA-2 and Alpaca-2 LLMs.",
	)

	register_model_info(
	["Vigogne-2-7B-Instruct", "Vigogne-2-13B-Instruct"],
	"Vigogne-Instruct",
	"https://huggingface.co/bofenghuang/vigogne-2-7b-instruct",
	"Vigogne-Instruct is a French large language model (LLM) optimized for instruction-following, developed by Bofeng Huang",
	)

	register_model_info(
	["Vigogne-2-7B-Chat", "Vigogne-2-13B-Chat"],
	"Vigogne-Chat",
	"https://huggingface.co/bofenghuang/vigogne-2-7b-chat",
	"Vigogne-Chat is a French large language model (LLM) optimized for instruction-following and multi-turn dialogues, developed by Bofeng Huang",
	)

	register_model_info(
	["stable-vicuna-13B-HF"],
	"stable-vicuna",
	"https://huggingface.co/TheBloke/stable-vicuna-13B-HF",
	"StableVicuna is a Vicuna model fine-tuned using RLHF via PPO on various conversational and instructional datasets.",
	)

	register_model_info(
	["deluxe-chat-v1", "deluxe-chat-v1.1", "deluxe-chat-v1.2"],
	"DeluxeChat",
	"",
	"Deluxe Chat",
	)

	register_model_info(
	[
	"Xwin-LM-7B-V0.1",
	"Xwin-LM-13B-V0.1",
	"Xwin-LM-70B-V0.1",
	"Xwin-LM-7B-V0.2",
	"Xwin-LM-13B-V0.2",
	],
	"Xwin-LM",
	"https://github.com/Xwin-LM/Xwin-LM",
	"Chat models developed by Xwin-LM team",
	)

	register_model_info(
	["lemur-70b-chat"],
	"Lemur-Chat",
	"https://huggingface.co/OpenLemur/lemur-70b-chat-v1",
	"an openly accessible language model optimized for both natural language and coding capabilities ",
	)

	register_model_info(
	["Mistral-7B-OpenOrca"],
	"Open-Orca",
	"https://huggingface.co/Open-Orca/Mistral-7B-OpenOrca",
	"A fine-tune of [Mistral 7B](https://huggingface.co/mistralai/Mistral-7B-v0.1) using [OpenOrca dataset](https://huggingface.co/datasets/Open-Orca/OpenOrca)",
	)

	register_model_info(
	["dolphin-2.2.1-mistral-7b"],
	"dolphin-mistral",
	"https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b",
	"An uncensored fine-tuned Mistral 7B",
	)

	register_model_info(
	[
	"AquilaChat-7B",
	"AquilaChat2-7B",
	"AquilaChat2-34B",
	],
	"Aquila-Chat",
	"https://huggingface.co/BAAI/AquilaChat2-34B",
	"Chat models developed by BAAI team",
	)

	register_model_info(
	["xDAN-L1-Chat-RL-v1"],
	"xDAN-L1-Chat",
	"https://huggingface.co/xDAN-AI/xDAN-L1-Chat-RL-v1",
	"A large language chat model created by xDAN-AI.",
	)

	register_model_info(
	["MetaMath-70B-V1.0", "MetaMath-7B-V1.0"],
	"MetaMath",
	"https://huggingface.co/meta-math",
	"MetaMath is a finetune of Llama2 on [MetaMathQA](https://huggingface.co/datasets/meta-math/MetaMathQA) that specializes in mathematical reasoning.",
	)

	register_model_info(
	["Yuan2-2B-hf", "Yuan2-51B-hf", "Yuan2-102B-hf"],
	"IEIYuan",
	"https://huggingface.co/IEITYuan",
	"Yuan2 is a Basemodel developed by IEI.",
	)