Spaces:

tianleliphoebe
/

visual-arena

Runtime error

App Files Files Community

visual-arena / fastchat /llm_judge /download_mt_bench_pregenerated.py

tianleliphoebe

Upload folder using huggingface_hub

ec0c335 verified 6 months ago

raw history blame contribute delete

No virus

2.25 kB

	"""
	Download the pre-generated model answers and judgments for MT-bench.
	"""
	import os

	from fastchat.utils import run_cmd

	# Names of the models that have a pre-generated answer file; each one maps
	# to "data/mt_bench/model_answer/<model>.jsonl".
	_answer_models = (
	    "alpaca-13b",
	    "baize-v2-13b",
	    "chatglm-6b",
	    "claude-instant-v1",
	    "claude-v1",
	    "dolly-v2-12b",
	    "falcon-40b-instruct",
	    "fastchat-t5-3b",
	    "gpt-3.5-turbo",
	    "gpt-4",
	    "gpt4all-13b-snoozy",
	    "guanaco-33b",
	    "guanaco-65b",
	    "h2ogpt-oasst-open-llama-13b",
	    "koala-13b",
	    "llama-13b",
	    "mpt-30b-chat",
	    "mpt-30b-instruct",
	    "mpt-7b-chat",
	    "nous-hermes-13b",
	    "oasst-sft-4-pythia-12b",
	    "oasst-sft-7-llama-30b",
	    "palm-2-chat-bison-001",
	    "rwkv-4-raven-14b",
	    "stablelm-tuned-alpha-7b",
	    "tulu-30b",
	    "vicuna-13b-v1.3",
	    "vicuna-33b-v1.3",
	    "vicuna-7b-v1.3",
	    "wizardlm-13b",
	    "wizardlm-30b",
	)

	# Judgment files, each mapping to "data/mt_bench/model_judgment/<name>.jsonl".
	_judgment_names = ("gpt-4_single", "gpt-4_pair")

	# Relative paths of every file to fetch: all model answers first, followed
	# by the judgment files. The same relative path is used both as the local
	# destination and as the suffix appended to the download URL prefix.
	filenames = [
	    f"data/mt_bench/model_answer/{model}.jsonl" for model in _answer_models
	] + [
	    f"data/mt_bench/model_judgment/{judgment}.jsonl"
	    for judgment in _judgment_names
	]


	if __name__ == "__main__":
	    # Script entry point: fetch every path listed in `filenames` from the
	    # MT-bench space and store it under the same relative path locally.
	    prefix = "https://huggingface.co/spaces/lmsys/mt-bench/resolve/main/"

	    for name in filenames:
	        # wget does not create missing parent directories for -O targets.
	        os.makedirs(os.path.dirname(name), exist_ok=True)
	        url = prefix + name
	        ret = run_cmd(f"wget -q --show-progress -O {name} {url}")
	        # The return value of run_cmd is treated as an exit status where 0
	        # means success. Check it explicitly instead of with `assert`:
	        # assertions are removed under `python -O`, which would let a
	        # failed download go unnoticed.
	        if ret != 0:
	            raise RuntimeError(
	                f"Failed to download {url} to {name} (exit status {ret}); "
	                "the local file may be empty or incomplete."
	            )