File size: 1,685 Bytes
8bf595d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
# @title ##### Combine Rerun of the Bracket - All
import os
import json
from tqdm import tqdm
from pathlib import Path

# Root directory for all model outputs; the TG_MODEL_OUTPUT_DIR environment
# variable overrides the default relative "model_outputs" folder.
MODEL_OUTPUT_DIR = Path(os.environ.get("TG_MODEL_OUTPUT_DIR", "model_outputs"))
# fd_new: directory the Bracket rerun results are read from.
fd_new = MODEL_OUTPUT_DIR.joinpath("__runs__", "_redo_bracket")
# fd_ori: directory the original results are read from.
fd_ori = MODEL_OUTPUT_DIR.joinpath("revalidate_anagram_3")
# fd_out: directory the combined results are written to.
fd_out = MODEL_OUTPUT_DIR.joinpath("revalidate_bracket_rerun")

# Result files to combine: one "results_<model>.<setting>.jsonl" per model and
# setting, grouped by model with the "1s" file listed before the "zs" file.
# NOTE(review): "1s"/"zs" presumably mean one-shot / zero-shot -- confirm.
OUTPUT_FILENAMES = [
    f"results_{model}.{setting}.jsonl"
    for model in (
        "gemma-2-9b-it",
        "gemma-2-27b-it",

        "llama-3.1-8b-instruct",
        "llama-3.1-70b-instruct",
        "llama-3.3-70b-instruct",

        "qwen2-5-7b-instruct",
        "qwen2-5-14b-instruct",
        "qwen2-5-32b-instruct",
        "qwen2-5-72b-instruct",
    )
    for setting in ("1s", "zs")
]

def _write_jsonl_line(dst, line):
    """Write one JSONL record to *dst*, ensuring it ends with a newline.

    A final line without a trailing newline would otherwise be fused with
    the next record written to the same output file.
    """
    dst.write(line if line.endswith("\n") else line + "\n")


# For every result file, build a combined file in fd_out that contains:
#   1. each record of the original file (fd_ori) whose "game" field does NOT
#      start with "Bracket Game", followed by
#   2. every record of the matching rerun file in fd_new.
os.makedirs(fd_out, exist_ok=True)
for fp in tqdm(OUTPUT_FILENAMES):
    # with_suffix replaces the trailing ".jsonl" with ".6.jsonl",
    # e.g. "results_x.1s.jsonl" -> "results_x.1s.6.jsonl".
    rerun_path = (fd_new / fp).with_suffix(".6.jsonl")
    with open(fd_out / fp, "w", encoding="utf8") as out_f:
        with open(fd_ori / fp, "r", encoding="utf8") as ori_f:
            for line in ori_f:
                if not line.strip():
                    # Blank lines are not records; json.loads would raise.
                    continue
                res = json.loads(line)
                if res['game'].startswith("Bracket Game"):
                    # Superseded by the rerun records appended below.
                    continue
                _write_jsonl_line(out_f, line)
        with open(rerun_path, "r", encoding="utf8") as new_f:
            for line in new_f:
                if not line.strip():
                    # Keep blank lines out of the combined JSONL.
                    continue
                _write_jsonl_line(out_f, line)