File size: 1,685 Bytes
8bf595d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 |
# @title ##### Combine Rerun of the Bracket - All
import os
import json
from tqdm import tqdm
from pathlib import Path
MODEL_OUTPUT_DIR = Path(os.getenv("TG_MODEL_OUTPUT_DIR", "model_outputs"))
fd_new = MODEL_OUTPUT_DIR / "__runs__" / "_redo_bracket"
fd_ori = MODEL_OUTPUT_DIR / "revalidate_anagram_3"
fd_out = MODEL_OUTPUT_DIR / "revalidate_bracket_rerun"
OUTPUT_FILENAMES = [
"results_gemma-2-9b-it.1s.jsonl",
"results_gemma-2-9b-it.zs.jsonl",
"results_gemma-2-27b-it.1s.jsonl",
"results_gemma-2-27b-it.zs.jsonl",
"results_llama-3.1-8b-instruct.1s.jsonl",
"results_llama-3.1-8b-instruct.zs.jsonl",
"results_llama-3.1-70b-instruct.1s.jsonl",
"results_llama-3.1-70b-instruct.zs.jsonl",
"results_llama-3.3-70b-instruct.1s.jsonl",
"results_llama-3.3-70b-instruct.zs.jsonl",
"results_qwen2-5-7b-instruct.1s.jsonl",
"results_qwen2-5-7b-instruct.zs.jsonl",
"results_qwen2-5-14b-instruct.1s.jsonl",
"results_qwen2-5-14b-instruct.zs.jsonl",
"results_qwen2-5-32b-instruct.1s.jsonl",
"results_qwen2-5-32b-instruct.zs.jsonl",
"results_qwen2-5-72b-instruct.1s.jsonl",
"results_qwen2-5-72b-instruct.zs.jsonl",
]
os.makedirs(fd_out, exist_ok=True)
for fp in tqdm(OUTPUT_FILENAMES):
with open(fd_out / fp, "w", encoding="utf8") as o:
with open(fd_ori / fp, "r", encoding="utf8") as i:
for line in i:
res = json.loads(line)
if res['game'].startswith("Bracket Game"):
continue
o.write(line)
with open((fd_new / fp).with_suffix(".6.jsonl"), "r", encoding="utf8") as i:
for line in i:
o.write(line) |