visual-arena / fastchat /llm_judge /download_mt_bench_pregenerated.py
tianleliphoebe's picture
Upload folder using huggingface_hub
ec0c335 verified
"""
Download the pre-generated model answers and judgments for MT-bench.
"""
import os
from fastchat.utils import run_cmd
filenames = [
"data/mt_bench/model_answer/alpaca-13b.jsonl",
"data/mt_bench/model_answer/baize-v2-13b.jsonl",
"data/mt_bench/model_answer/chatglm-6b.jsonl",
"data/mt_bench/model_answer/claude-instant-v1.jsonl",
"data/mt_bench/model_answer/claude-v1.jsonl",
"data/mt_bench/model_answer/dolly-v2-12b.jsonl",
"data/mt_bench/model_answer/falcon-40b-instruct.jsonl",
"data/mt_bench/model_answer/fastchat-t5-3b.jsonl",
"data/mt_bench/model_answer/gpt-3.5-turbo.jsonl",
"data/mt_bench/model_answer/gpt-4.jsonl",
"data/mt_bench/model_answer/gpt4all-13b-snoozy.jsonl",
"data/mt_bench/model_answer/guanaco-33b.jsonl",
"data/mt_bench/model_answer/guanaco-65b.jsonl",
"data/mt_bench/model_answer/h2ogpt-oasst-open-llama-13b.jsonl",
"data/mt_bench/model_answer/koala-13b.jsonl",
"data/mt_bench/model_answer/llama-13b.jsonl",
"data/mt_bench/model_answer/mpt-30b-chat.jsonl",
"data/mt_bench/model_answer/mpt-30b-instruct.jsonl",
"data/mt_bench/model_answer/mpt-7b-chat.jsonl",
"data/mt_bench/model_answer/nous-hermes-13b.jsonl",
"data/mt_bench/model_answer/oasst-sft-4-pythia-12b.jsonl",
"data/mt_bench/model_answer/oasst-sft-7-llama-30b.jsonl",
"data/mt_bench/model_answer/palm-2-chat-bison-001.jsonl",
"data/mt_bench/model_answer/rwkv-4-raven-14b.jsonl",
"data/mt_bench/model_answer/stablelm-tuned-alpha-7b.jsonl",
"data/mt_bench/model_answer/tulu-30b.jsonl",
"data/mt_bench/model_answer/vicuna-13b-v1.3.jsonl",
"data/mt_bench/model_answer/vicuna-33b-v1.3.jsonl",
"data/mt_bench/model_answer/vicuna-7b-v1.3.jsonl",
"data/mt_bench/model_answer/wizardlm-13b.jsonl",
"data/mt_bench/model_answer/wizardlm-30b.jsonl",
"data/mt_bench/model_judgment/gpt-4_single.jsonl",
"data/mt_bench/model_judgment/gpt-4_pair.jsonl",
]
if __name__ == "__main__":
prefix = "https://huggingface.co/spaces/lmsys/mt-bench/resolve/main/"
for name in filenames:
os.makedirs(os.path.dirname(name), exist_ok=True)
ret = run_cmd(f"wget -q --show-progress -O {name} {prefix + name}")
assert ret == 0