pere committed on
Commit
e7539cc
1 Parent(s): 807357d
generate_stats.py CHANGED
@@ -12,8 +12,8 @@ bucket_name = "nb-t5x-us-central2"
12
  bucket = client.bucket(bucket_name)
13
 
14
 
15
- checkpoints=["exp1-t5-base-ul2-engvoc","exp2-t5-base-ul2-scandvoc","exp3-t5-base-span-engvoc","exp4-t5-base-span-scandvoc","exp5-t5-base-ul2-scandvoc-full","exp6-t5-base-span-scandvoc-full","exp7-t5-base-ul2-511-scandvoc","exp8-t5-base-span-511-scandvoc","exp9-t5-base-ul2-mt5voc","exp10-t5-base-span-mt5voc","exp11-t5-base-ul2-511-scandvoc-full","exp12-t5-base-span-511-scandvoc-full","exp13-t5-base-ul2-mt5voc-full","exp14-t5-base-span-mt5voc-full","exp15-t5-base-ul2-511-scandvoc-full-scratch","exp16-t5-base-span-511-scandvoc-full-scratch","exp17-t5-small-ul2-mt5voc-scratch","exp18-t5-small-span-mt5voc-scratch","exp19-t5-small-ul2-mt5voc","exp20-t5-small-span-mt5voc","exp21-t5-small-ul2-mt5voc-full","exp22-t5-small-span-mt5voc-full"]
16
- #checkpoints=["exp19-t5-small-ul2-mt5voc"]
17
 
18
  start=["100000","200000","300000","400000","500000","1000000","1100000","1184000","1200000","1204000","1284000","1300000","1384000","1400000","1484000","1500000"]
19
 
 
12
  bucket = client.bucket(bucket_name)
13
 
14
 
15
+ checkpoints=["exp1-t5-base-ul2-engvoc","exp2-t5-base-ul2-scandvoc","exp3-t5-base-span-engvoc","exp4-t5-base-span-scandvoc","exp5-t5-base-ul2-scandvoc-full","exp6-t5-base-span-scandvoc-full","exp7-t5-base-ul2-511-scandvoc","exp8-t5-base-span-511-scandvoc","exp9-t5-base-ul2-mt5voc","exp10-t5-base-span-mt5voc","exp11-t5-base-ul2-511-scandvoc-full","exp12-t5-base-span-511-scandvoc-full","exp13-t5-base-ul2-mt5voc-full","exp14-t5-base-span-mt5voc-full","exp15-t5-base-ul2-511-scandvoc-full-scratch","exp16-t5-base-span-511-scandvoc-full-scratch","exp17-t5-small-ul2-mt5voc-scratch","exp18-t5-small-span-mt5voc-scratch","exp19-t5-small-ul2-mt5voc","exp20-t5-small-span-mt5voc","exp21-t5-small-ul2-mt5voc-full","exp22-t5-small-span-mt5voc-full"]
16
+
17
 
18
  start=["100000","200000","300000","400000","500000","1000000","1100000","1184000","1200000","1204000","1284000","1300000","1384000","1400000","1484000","1500000"]
19
 
generate_stats_various.py ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Collect fine-tuning evaluation metrics from GCS and export summary tables.

For every (iteration, checkpoint) pair the script looks up one
``*-metrics.jsonl`` blob in the bucket, parses each JSON line, annotates it
with metadata derived from the blob path, and writes the combined records
plus per-experiment averages at 5000 fine-tuning steps to ``stats_various/``.
"""
from google.cloud import storage
import pandas as pd
import json
import os
import re
import sys

# Create a storage client
client = storage.Client()

# Get the bucket
bucket_name = "nb-t5x-us-central2"
bucket = client.bucket(bucket_name)

checkpoints = [
    "exp100_mt5_small",
    "exp101_north_t5_base_NCC",
    "exp102_north_t5_base_NCC_lm",
    "exp103_north_t5_base_scand3M",
    "exp104_mt5_base",
    "exp105_sab_base_2",
    "exp106_sab_base_3",
    "exp107_sab_base_4",
]

# NOTE(review): kept for backward compatibility only. The metrics path does
# not contain a pretraining step, so looping over this list merely queued
# every path five times (five downloads per file, inflated counters).
start = ["1500000", "1600000", "2000000", "3000000", "4000000"]

iterations = ["1", "2", "3", "4", "5"]

output_dir = "stats_various"

# Patterns that pull metadata out of a metrics path; compiled once because
# they are applied to every file.
_VOCAB_RE = re.compile(r"_(\w+?)-metric")
_EXPERIMENT_RE = re.compile(r"_exp(\w+?)_")
_VERSION_RE = re.compile(r"_v(\w+?)/")
_EXPERIMENT_NAME_RE = re.compile(r"exp\d+_(.*?)_v")


def _metrics_path(checkpoint, iteration):
    """Return the bucket-relative metrics path for one checkpoint/iteration."""
    if "scand" in checkpoint:
        suffix = "parliament_max300_scand-metrics.jsonl"
    elif "mt5" in checkpoint or "north" in checkpoint:
        suffix = "parliament_max300_mt5-metrics.jsonl"
    else:
        suffix = "parliament_max300-metrics.jsonl"
    return f'finetuned/ul2test/eval_political_{checkpoint}_v{iteration}/inference_eval/{suffix}'


def _average_at(frame, finetuning_steps, count_column):
    """Return (rows at ``finetuning_steps``, per-experiment means of them).

    The averaged frame gets an extra ``count_column`` holding the number of
    rows that went into each group.
    """
    subset = frame[frame["finetuning_steps"] == finetuning_steps]
    grouped = subset[
        ["experiment_name", "experiment", "pretraining_steps", "accuracy", "f1_macro"]
    ].groupby(["experiment", "experiment_name", "pretraining_steps"])
    averaged = grouped.mean().reset_index()
    averaged = averaged.assign(**{count_column: grouped.size().values})
    return subset, averaged


# One path per (iteration, checkpoint), in the same order as before.
file_names = [_metrics_path(c, i) for i in iterations for c in checkpoints]

# list to store json files data
file_contents = []

downloaded = 0
not_downloaded = 0

# iterate over the files
for file_name in file_names:
    # Get the file; get_blob() yields a falsy value when it is not available
    blob = bucket.get_blob(file_name)
    print(f'gs://{bucket_name}/{file_name}')

    if not blob:
        not_downloaded += 1
        continue
    downloaded += 1

    # download_as_string() is a deprecated alias of download_as_bytes()
    content = blob.download_as_bytes().decode("utf-8")

    # Path-derived metadata is identical for every line of the file
    vocab = _VOCAB_RE.search(file_name).group(1)
    experiment = _EXPERIMENT_RE.search(file_name).group(1)
    version = _VERSION_RE.search(file_name).group(1)
    experiment_name = _EXPERIMENT_NAME_RE.search(file_name).group(1)

    # Split the content by newline; each non-blank line is one JSON record
    for line in content.split("\n"):
        if not line.strip():
            continue
        data = json.loads(line)
        data['base_file_name'] = file_name
        # Fixed to 0: the regex that used to extract this from the path is
        # disabled in this script.
        data['pretraining_steps'] = 0
        # Last four digits of the step counter
        data['finetuning_steps'] = int(str(data['step'])[-4:])
        data['vocab'] = vocab
        data['experiment'] = experiment
        data['version'] = version
        data['experiment_name'] = experiment_name
        file_contents.append(data)

print(f"\nTotally {downloaded} files downloaded, {not_downloaded} files not downloaded")

if not file_contents:
    # Without any record the frame has no columns and the de-duplication
    # below would fail with an opaque KeyError.
    sys.exit("No metrics could be loaded; nothing to export")

df = pd.json_normalize(file_contents)
# reset_index() keeps the pre-deduplication row number as an "index" column
df = df.drop_duplicates(subset=['step', 'experiment', 'version']).reset_index()

only_5000, average_at_5000 = _average_at(df, 5000, "num_experiments")
# Not exported; available for ad-hoc inspection
only_3000, average_at_3000 = _average_at(df, 3000, "rows_count")

print(average_at_5000.to_string(index=False))

print("\nNot complete:")
# An experiment is complete when every iteration contributed one row
uncomplete = average_at_5000[average_at_5000['num_experiments'] != len(iterations)]
print(uncomplete)

# The export calls below do not create missing directories
os.makedirs(output_dir, exist_ok=True)

df.to_json(f"{output_dir}/all.jsonl", orient="records", lines=True)
df.to_csv(f"{output_dir}/all.csv", index=False)

only_5000.to_json(f"{output_dir}/only_5000.jsonl", orient="records", lines=True)
only_5000.to_csv(f"{output_dir}/only_5000.csv", index=False)

average_at_5000.to_json(f"{output_dir}/average_at_5000.jsonl", orient="records", lines=True)
average_at_5000.to_csv(f"{output_dir}/average_at_5000.csv", index=False)

print(f"Files exported to {output_dir}")
stats_various/all.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ index,step,accuracy,f1_macro,base_file_name,pretraining_steps,finetuning_steps,vocab,experiment,version,experiment_name
2
+ 0,1001000,74.66666666666667,74.60734660693453,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,100,1,mt5_small
3
+ 1,1002000,72.41666666666666,72.3251667492313,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,100,1,mt5_small
4
+ 2,1003000,70.83333333333334,70.8099001698586,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,100,1,mt5_small
5
+ 3,1004000,69.41666666666667,69.36558803950199,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,100,1,mt5_small
6
+ 4,1005000,69.41666666666667,69.37734632872348,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,1,mt5_small
7
+ 25,1501000,76.58333333333334,76.57967390738136,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,101,1,north_t5_base_NCC
8
+ 26,1502000,80.58333333333333,80.57349866703352,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,101,1,north_t5_base_NCC
9
+ 27,1503000,84.0,83.97845992946074,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,101,1,north_t5_base_NCC
10
+ 28,1504000,85.0,84.99983333148147,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,101,1,north_t5_base_NCC
11
+ 29,1505000,85.08333333333333,85.06756094458106,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,1,north_t5_base_NCC
12
+ 50,1601000,73.66666666666667,73.3240286344604,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,102,1,north_t5_base_NCC_lm
13
+ 51,1602000,77.08333333333334,76.87830491350034,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,102,1,north_t5_base_NCC_lm
14
+ 52,1603000,80.33333333333333,80.3175326859618,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,102,1,north_t5_base_NCC_lm
15
+ 53,1604000,80.83333333333333,80.82289246367466,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,102,1,north_t5_base_NCC_lm
16
+ 54,1605000,82.0,81.92362732545003,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,1,north_t5_base_NCC_lm
17
+ 75,1001000,75.0,74.96634363978238,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,104,1,mt5_base
18
+ 76,1002000,73.66666666666667,73.65019804044194,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,104,1,mt5_base
19
+ 77,1003000,74.08333333333333,74.07683453977005,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,104,1,mt5_base
20
+ 78,1004000,73.16666666666667,73.16480311132719,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,104,1,mt5_base
21
+ 79,1005000,73.83333333333333,73.79139957264957,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,1,mt5_base
22
+ 100,1001000,73.0,72.98919567827132,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,100,2,mt5_small
23
+ 101,1002000,69.83333333333334,69.63902308105207,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,100,2,mt5_small
24
+ 102,1003000,69.58333333333333,69.52388374266188,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,100,2,mt5_small
25
+ 103,1004000,68.25,67.95570429815494,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,100,2,mt5_small
26
+ 104,1005000,68.41666666666667,68.33484302144639,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,2,mt5_small
27
+ 125,1501000,77.25,77.24922584171267,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,101,2,north_t5_base_NCC
28
+ 126,1502000,80.58333333333333,80.54245898502062,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,101,2,north_t5_base_NCC
29
+ 127,1503000,81.66666666666667,81.5485775630703,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,101,2,north_t5_base_NCC
30
+ 128,1504000,85.33333333333334,85.30132288094072,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,101,2,north_t5_base_NCC
31
+ 129,1505000,86.41666666666666,86.40079147949793,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,2,north_t5_base_NCC
32
+ 150,1601000,74.5,74.28391343931648,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,102,2,north_t5_base_NCC_lm
33
+ 151,1602000,79.0,78.98686679174484,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,102,2,north_t5_base_NCC_lm
34
+ 152,1603000,80.08333333333333,80.06438065077145,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,102,2,north_t5_base_NCC_lm
35
+ 153,1604000,79.83333333333333,79.77214406914248,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,102,2,north_t5_base_NCC_lm
36
+ 154,1605000,81.16666666666667,81.12845178152426,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,2,north_t5_base_NCC_lm
37
+ 175,1001000,73.91666666666666,73.91360513838082,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,104,2,mt5_base
38
+ 176,1002000,72.58333333333333,72.43846300450075,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,104,2,mt5_base
39
+ 177,1003000,73.91666666666666,73.9114308357719,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,104,2,mt5_base
40
+ 178,1004000,72.5,72.38331952499311,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,104,2,mt5_base
41
+ 179,1005000,73.33333333333333,73.27089116519426,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,2,mt5_base
42
+ 200,1001000,71.08333333333333,70.96378073331098,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,100,3,mt5_small
43
+ 201,1002000,67.41666666666667,66.98636604464721,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,100,3,mt5_small
44
+ 202,1003000,67.16666666666666,67.15352807789783,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,100,3,mt5_small
45
+ 203,1004000,66.91666666666667,66.80044516951355,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,100,3,mt5_small
46
+ 204,1005000,67.5,67.49990972197143,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,3,mt5_small
47
+ 225,1501000,75.58333333333334,75.24151145080096,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,101,3,north_t5_base_NCC
48
+ 226,1502000,81.16666666666667,81.16666666666667,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,101,3,north_t5_base_NCC
49
+ 227,1503000,84.5,84.49272019364645,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,101,3,north_t5_base_NCC
50
+ 228,1504000,85.66666666666667,85.66184745428325,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,101,3,north_t5_base_NCC
51
+ 229,1505000,86.41666666666666,86.41394001990676,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,3,north_t5_base_NCC
52
+ 250,1601000,75.58333333333334,75.53915092469106,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,102,3,north_t5_base_NCC_lm
53
+ 251,1602000,76.58333333333334,76.27408915229121,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,102,3,north_t5_base_NCC_lm
54
+ 252,1603000,80.58333333333333,80.57943573397716,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,102,3,north_t5_base_NCC_lm
55
+ 253,1604000,79.41666666666667,79.22587653974873,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,102,3,north_t5_base_NCC_lm
56
+ 254,1605000,82.08333333333333,82.0788405982333,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,3,north_t5_base_NCC_lm
57
+ 275,1001000,73.66666666666667,73.666374070823,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,104,3,mt5_base
58
+ 276,1002000,72.25,72.15251446208568,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,104,3,mt5_base
59
+ 277,1003000,72.83333333333334,72.82578494026119,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,104,3,mt5_base
60
+ 278,1004000,73.58333333333333,73.43054049013809,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,104,3,mt5_base
61
+ 279,1005000,73.33333333333333,73.18248481039178,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,3,mt5_base
62
+ 300,1001000,72.41666666666666,72.27757324073913,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,100,4,mt5_small
63
+ 301,1002000,69.5,69.45511598988514,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,100,4,mt5_small
64
+ 302,1003000,68.58333333333333,68.39349677332814,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,100,4,mt5_small
65
+ 303,1004000,67.75,67.66086525987252,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,100,4,mt5_small
66
+ 304,1005000,67.75,67.74012041187613,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,4,mt5_small
67
+ 325,1501000,74.08333333333333,73.59616422733052,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,101,4,north_t5_base_NCC
68
+ 326,1502000,76.58333333333334,76.31807937657274,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,101,4,north_t5_base_NCC
69
+ 327,1503000,82.08333333333333,82.07136846186935,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,101,4,north_t5_base_NCC
70
+ 328,1504000,83.25,83.2480339706535,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,101,4,north_t5_base_NCC
71
+ 329,1505000,83.75,83.74746054070948,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,4,north_t5_base_NCC
72
+ 350,1601000,75.5,75.31458510590659,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,102,4,north_t5_base_NCC_lm
73
+ 351,1602000,79.33333333333333,79.33051998744273,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,102,4,north_t5_base_NCC_lm
74
+ 352,1603000,79.91666666666667,79.88312457089913,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,102,4,north_t5_base_NCC_lm
75
+ 353,1604000,81.16666666666667,81.16666666666667,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,102,4,north_t5_base_NCC_lm
76
+ 354,1605000,81.25,81.23580958099564,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,4,north_t5_base_NCC_lm
77
+ 375,1001000,74.33333333333333,74.33326203683899,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,104,4,mt5_base
78
+ 376,1002000,74.25,74.23495249656223,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,104,4,mt5_base
79
+ 377,1003000,73.83333333333333,73.82286247832467,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,104,4,mt5_base
80
+ 378,1004000,72.91666666666666,72.91574504965794,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,104,4,mt5_base
81
+ 379,1005000,71.5,71.46163174935191,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,4,mt5_base
82
+ 400,1001000,72.08333333333333,72.08098736074349,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,100,5,mt5_small
83
+ 401,1002000,70.08333333333333,70.07982186798311,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,100,5,mt5_small
84
+ 402,1003000,70.16666666666667,70.16666666666667,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,100,5,mt5_small
85
+ 403,1004000,68.83333333333333,68.82285434826706,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,100,5,mt5_small
86
+ 404,1005000,70.0,69.98991327640678,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,5,mt5_small
87
+ 425,1501000,75.16666666666667,74.7056776416864,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,101,5,north_t5_base_NCC
88
+ 426,1502000,83.25,83.24663769325929,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,101,5,north_t5_base_NCC
89
+ 427,1503000,83.33333333333334,83.25126452952802,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,101,5,north_t5_base_NCC
90
+ 428,1504000,85.75,85.74951508766617,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,101,5,north_t5_base_NCC
91
+ 429,1505000,86.0,85.9968492910905,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,5,north_t5_base_NCC
92
+ 450,1601000,74.75,74.71753661472265,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,102,5,north_t5_base_NCC_lm
93
+ 451,1602000,79.25,79.15025423711073,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,102,5,north_t5_base_NCC_lm
94
+ 452,1603000,79.83333333333333,79.80365592773828,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,102,5,north_t5_base_NCC_lm
95
+ 453,1604000,81.16666666666667,81.16143373159213,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,102,5,north_t5_base_NCC_lm
96
+ 454,1605000,82.66666666666667,82.66430708624229,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,5,north_t5_base_NCC_lm
97
+ 475,1001000,71.33333333333334,71.1921749907882,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,1000,max300_mt5,104,5,mt5_base
98
+ 476,1002000,71.33333333333334,71.3177174239308,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,2000,max300_mt5,104,5,mt5_base
99
+ 477,1003000,71.0,70.99871105382461,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,3000,max300_mt5,104,5,mt5_base
100
+ 478,1004000,69.91666666666667,69.75027215677348,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,4000,max300_mt5,104,5,mt5_base
101
+ 479,1005000,70.83333333333334,70.79756034475567,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,5,mt5_base
stats_various/all.jsonl ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"index":0,"step":1001000,"accuracy":74.6666666667,"f1_macro":74.6073466069,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
2
+ {"index":1,"step":1002000,"accuracy":72.4166666667,"f1_macro":72.3251667492,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
3
+ {"index":2,"step":1003000,"accuracy":70.8333333333,"f1_macro":70.8099001699,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
4
+ {"index":3,"step":1004000,"accuracy":69.4166666667,"f1_macro":69.3655880395,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
5
+ {"index":4,"step":1005000,"accuracy":69.4166666667,"f1_macro":69.3773463287,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
6
+ {"index":25,"step":1501000,"accuracy":76.5833333333,"f1_macro":76.5796739074,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
7
+ {"index":26,"step":1502000,"accuracy":80.5833333333,"f1_macro":80.573498667,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
8
+ {"index":27,"step":1503000,"accuracy":84.0,"f1_macro":83.9784599295,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
9
+ {"index":28,"step":1504000,"accuracy":85.0,"f1_macro":84.9998333315,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
10
+ {"index":29,"step":1505000,"accuracy":85.0833333333,"f1_macro":85.0675609446,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
11
+ {"index":50,"step":1601000,"accuracy":73.6666666667,"f1_macro":73.3240286345,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
12
+ {"index":51,"step":1602000,"accuracy":77.0833333333,"f1_macro":76.8783049135,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
13
+ {"index":52,"step":1603000,"accuracy":80.3333333333,"f1_macro":80.317532686,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
14
+ {"index":53,"step":1604000,"accuracy":80.8333333333,"f1_macro":80.8228924637,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
15
+ {"index":54,"step":1605000,"accuracy":82.0,"f1_macro":81.9236273255,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
16
+ {"index":75,"step":1001000,"accuracy":75.0,"f1_macro":74.9663436398,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
17
+ {"index":76,"step":1002000,"accuracy":73.6666666667,"f1_macro":73.6501980404,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
18
+ {"index":77,"step":1003000,"accuracy":74.0833333333,"f1_macro":74.0768345398,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
19
+ {"index":78,"step":1004000,"accuracy":73.1666666667,"f1_macro":73.1648031113,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
20
+ {"index":79,"step":1005000,"accuracy":73.8333333333,"f1_macro":73.7913995726,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
21
+ {"index":100,"step":1001000,"accuracy":73.0,"f1_macro":72.9891956783,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
22
+ {"index":101,"step":1002000,"accuracy":69.8333333333,"f1_macro":69.6390230811,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
23
+ {"index":102,"step":1003000,"accuracy":69.5833333333,"f1_macro":69.5238837427,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
24
+ {"index":103,"step":1004000,"accuracy":68.25,"f1_macro":67.9557042982,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
25
+ {"index":104,"step":1005000,"accuracy":68.4166666667,"f1_macro":68.3348430214,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
26
+ {"index":125,"step":1501000,"accuracy":77.25,"f1_macro":77.2492258417,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
27
+ {"index":126,"step":1502000,"accuracy":80.5833333333,"f1_macro":80.542458985,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
28
+ {"index":127,"step":1503000,"accuracy":81.6666666667,"f1_macro":81.5485775631,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
29
+ {"index":128,"step":1504000,"accuracy":85.3333333333,"f1_macro":85.3013228809,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
30
+ {"index":129,"step":1505000,"accuracy":86.4166666667,"f1_macro":86.4007914795,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
31
+ {"index":150,"step":1601000,"accuracy":74.5,"f1_macro":74.2839134393,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
32
+ {"index":151,"step":1602000,"accuracy":79.0,"f1_macro":78.9868667917,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
33
+ {"index":152,"step":1603000,"accuracy":80.0833333333,"f1_macro":80.0643806508,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
34
+ {"index":153,"step":1604000,"accuracy":79.8333333333,"f1_macro":79.7721440691,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
35
+ {"index":154,"step":1605000,"accuracy":81.1666666667,"f1_macro":81.1284517815,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
36
+ {"index":175,"step":1001000,"accuracy":73.9166666667,"f1_macro":73.9136051384,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
37
+ {"index":176,"step":1002000,"accuracy":72.5833333333,"f1_macro":72.4384630045,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
38
+ {"index":177,"step":1003000,"accuracy":73.9166666667,"f1_macro":73.9114308358,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
39
+ {"index":178,"step":1004000,"accuracy":72.5,"f1_macro":72.383319525,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
40
+ {"index":179,"step":1005000,"accuracy":73.3333333333,"f1_macro":73.2708911652,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
41
+ {"index":200,"step":1001000,"accuracy":71.0833333333,"f1_macro":70.9637807333,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
42
+ {"index":201,"step":1002000,"accuracy":67.4166666667,"f1_macro":66.9863660446,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
43
+ {"index":202,"step":1003000,"accuracy":67.1666666667,"f1_macro":67.1535280779,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
44
+ {"index":203,"step":1004000,"accuracy":66.9166666667,"f1_macro":66.8004451695,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
45
+ {"index":204,"step":1005000,"accuracy":67.5,"f1_macro":67.499909722,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
46
+ {"index":225,"step":1501000,"accuracy":75.5833333333,"f1_macro":75.2415114508,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
47
+ {"index":226,"step":1502000,"accuracy":81.1666666667,"f1_macro":81.1666666667,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
48
+ {"index":227,"step":1503000,"accuracy":84.5,"f1_macro":84.4927201936,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
49
+ {"index":228,"step":1504000,"accuracy":85.6666666667,"f1_macro":85.6618474543,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
50
+ {"index":229,"step":1505000,"accuracy":86.4166666667,"f1_macro":86.4139400199,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
51
+ {"index":250,"step":1601000,"accuracy":75.5833333333,"f1_macro":75.5391509247,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
52
+ {"index":251,"step":1602000,"accuracy":76.5833333333,"f1_macro":76.2740891523,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
53
+ {"index":252,"step":1603000,"accuracy":80.5833333333,"f1_macro":80.579435734,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
54
+ {"index":253,"step":1604000,"accuracy":79.4166666667,"f1_macro":79.2258765397,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
55
+ {"index":254,"step":1605000,"accuracy":82.0833333333,"f1_macro":82.0788405982,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
56
+ {"index":275,"step":1001000,"accuracy":73.6666666667,"f1_macro":73.6663740708,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
57
+ {"index":276,"step":1002000,"accuracy":72.25,"f1_macro":72.1525144621,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
58
+ {"index":277,"step":1003000,"accuracy":72.8333333333,"f1_macro":72.8257849403,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
59
+ {"index":278,"step":1004000,"accuracy":73.5833333333,"f1_macro":73.4305404901,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
60
+ {"index":279,"step":1005000,"accuracy":73.3333333333,"f1_macro":73.1824848104,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
61
+ {"index":300,"step":1001000,"accuracy":72.4166666667,"f1_macro":72.2775732407,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
62
+ {"index":301,"step":1002000,"accuracy":69.5,"f1_macro":69.4551159899,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
63
+ {"index":302,"step":1003000,"accuracy":68.5833333333,"f1_macro":68.3934967733,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
64
+ {"index":303,"step":1004000,"accuracy":67.75,"f1_macro":67.6608652599,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
65
+ {"index":304,"step":1005000,"accuracy":67.75,"f1_macro":67.7401204119,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
66
+ {"index":325,"step":1501000,"accuracy":74.0833333333,"f1_macro":73.5961642273,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
67
+ {"index":326,"step":1502000,"accuracy":76.5833333333,"f1_macro":76.3180793766,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
68
+ {"index":327,"step":1503000,"accuracy":82.0833333333,"f1_macro":82.0713684619,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
69
+ {"index":328,"step":1504000,"accuracy":83.25,"f1_macro":83.2480339707,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
70
+ {"index":329,"step":1505000,"accuracy":83.75,"f1_macro":83.7474605407,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
71
+ {"index":350,"step":1601000,"accuracy":75.5,"f1_macro":75.3145851059,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
72
+ {"index":351,"step":1602000,"accuracy":79.3333333333,"f1_macro":79.3305199874,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
73
+ {"index":352,"step":1603000,"accuracy":79.9166666667,"f1_macro":79.8831245709,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
74
+ {"index":353,"step":1604000,"accuracy":81.1666666667,"f1_macro":81.1666666667,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
75
+ {"index":354,"step":1605000,"accuracy":81.25,"f1_macro":81.235809581,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
76
+ {"index":375,"step":1001000,"accuracy":74.3333333333,"f1_macro":74.3332620368,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
77
+ {"index":376,"step":1002000,"accuracy":74.25,"f1_macro":74.2349524966,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
78
+ {"index":377,"step":1003000,"accuracy":73.8333333333,"f1_macro":73.8228624783,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
79
+ {"index":378,"step":1004000,"accuracy":72.9166666667,"f1_macro":72.9157450497,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
80
+ {"index":379,"step":1005000,"accuracy":71.5,"f1_macro":71.4616317494,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
81
+ {"index":400,"step":1001000,"accuracy":72.0833333333,"f1_macro":72.0809873607,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
82
+ {"index":401,"step":1002000,"accuracy":70.0833333333,"f1_macro":70.079821868,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
83
+ {"index":402,"step":1003000,"accuracy":70.1666666667,"f1_macro":70.1666666667,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
84
+ {"index":403,"step":1004000,"accuracy":68.8333333333,"f1_macro":68.8228543483,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
85
+ {"index":404,"step":1005000,"accuracy":70.0,"f1_macro":69.9899132764,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
86
+ {"index":425,"step":1501000,"accuracy":75.1666666667,"f1_macro":74.7056776417,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
87
+ {"index":426,"step":1502000,"accuracy":83.25,"f1_macro":83.2466376933,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
88
+ {"index":427,"step":1503000,"accuracy":83.3333333333,"f1_macro":83.2512645295,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
89
+ {"index":428,"step":1504000,"accuracy":85.75,"f1_macro":85.7495150877,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
90
+ {"index":429,"step":1505000,"accuracy":86.0,"f1_macro":85.9968492911,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
91
+ {"index":450,"step":1601000,"accuracy":74.75,"f1_macro":74.7175366147,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
92
+ {"index":451,"step":1602000,"accuracy":79.25,"f1_macro":79.1502542371,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
93
+ {"index":452,"step":1603000,"accuracy":79.8333333333,"f1_macro":79.8036559277,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
94
+ {"index":453,"step":1604000,"accuracy":81.1666666667,"f1_macro":81.1614337316,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
95
+ {"index":454,"step":1605000,"accuracy":82.6666666667,"f1_macro":82.6643070862,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
96
+ {"index":475,"step":1001000,"accuracy":71.3333333333,"f1_macro":71.1921749908,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":1000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}
97
+ {"index":476,"step":1002000,"accuracy":71.3333333333,"f1_macro":71.3177174239,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":2000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}
98
+ {"index":477,"step":1003000,"accuracy":71.0,"f1_macro":70.9987110538,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":3000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}
99
+ {"index":478,"step":1004000,"accuracy":69.9166666667,"f1_macro":69.7502721568,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":4000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}
100
+ {"index":479,"step":1005000,"accuracy":70.8333333333,"f1_macro":70.7975603448,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}
stats_various/average_at_5000.csv ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ experiment,experiment_name,pretraining_steps,accuracy,f1_macro,num_experiments
2
+ 100,mt5_small,0,68.61666666666667,68.58842655208484,5
3
+ 101,north_t5_base_NCC,0,85.53333333333333,85.52532045515714,5
4
+ 102,north_t5_base_NCC_lm,0,81.83333333333334,81.8062072744891,5
5
+ 104,mt5_base,0,72.56666666666666,72.50079352846863,5
stats_various/average_at_5000.jsonl ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {"experiment":"100","experiment_name":"mt5_small","pretraining_steps":0,"accuracy":68.6166666667,"f1_macro":68.5884265521,"num_experiments":5}
2
+ {"experiment":"101","experiment_name":"north_t5_base_NCC","pretraining_steps":0,"accuracy":85.5333333333,"f1_macro":85.5253204552,"num_experiments":5}
3
+ {"experiment":"102","experiment_name":"north_t5_base_NCC_lm","pretraining_steps":0,"accuracy":81.8333333333,"f1_macro":81.8062072745,"num_experiments":5}
4
+ {"experiment":"104","experiment_name":"mt5_base","pretraining_steps":0,"accuracy":72.5666666667,"f1_macro":72.5007935285,"num_experiments":5}
stats_various/only_5000.csv ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ index,step,accuracy,f1_macro,base_file_name,pretraining_steps,finetuning_steps,vocab,experiment,version,experiment_name
2
+ 4,1005000,69.41666666666667,69.37734632872348,finetuned/ul2test/eval_political_exp100_mt5_small_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,1,mt5_small
3
+ 29,1505000,85.08333333333333,85.06756094458106,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,1,north_t5_base_NCC
4
+ 54,1605000,82.0,81.92362732545003,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,1,north_t5_base_NCC_lm
5
+ 79,1005000,73.83333333333333,73.79139957264957,finetuned/ul2test/eval_political_exp104_mt5_base_v1/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,1,mt5_base
6
+ 104,1005000,68.41666666666667,68.33484302144639,finetuned/ul2test/eval_political_exp100_mt5_small_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,2,mt5_small
7
+ 129,1505000,86.41666666666666,86.40079147949793,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,2,north_t5_base_NCC
8
+ 154,1605000,81.16666666666667,81.12845178152426,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,2,north_t5_base_NCC_lm
9
+ 179,1005000,73.33333333333333,73.27089116519426,finetuned/ul2test/eval_political_exp104_mt5_base_v2/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,2,mt5_base
10
+ 204,1005000,67.5,67.49990972197143,finetuned/ul2test/eval_political_exp100_mt5_small_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,3,mt5_small
11
+ 229,1505000,86.41666666666666,86.41394001990676,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,3,north_t5_base_NCC
12
+ 254,1605000,82.08333333333333,82.0788405982333,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,3,north_t5_base_NCC_lm
13
+ 279,1005000,73.33333333333333,73.18248481039178,finetuned/ul2test/eval_political_exp104_mt5_base_v3/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,3,mt5_base
14
+ 304,1005000,67.75,67.74012041187613,finetuned/ul2test/eval_political_exp100_mt5_small_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,4,mt5_small
15
+ 329,1505000,83.75,83.74746054070948,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,4,north_t5_base_NCC
16
+ 354,1605000,81.25,81.23580958099564,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,4,north_t5_base_NCC_lm
17
+ 379,1005000,71.5,71.46163174935191,finetuned/ul2test/eval_political_exp104_mt5_base_v4/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,4,mt5_base
18
+ 404,1005000,70.0,69.98991327640678,finetuned/ul2test/eval_political_exp100_mt5_small_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,100,5,mt5_small
19
+ 429,1505000,86.0,85.9968492910905,finetuned/ul2test/eval_political_exp101_north_t5_base_NCC_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,101,5,north_t5_base_NCC
20
+ 454,1605000,82.66666666666667,82.66430708624229,finetuned/ul2test/eval_political_exp102_north_t5_base_NCC_lm_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,102,5,north_t5_base_NCC_lm
21
+ 479,1005000,70.83333333333334,70.79756034475567,finetuned/ul2test/eval_political_exp104_mt5_base_v5/inference_eval/parliament_max300_mt5-metrics.jsonl,0,5000,max300_mt5,104,5,mt5_base
stats_various/only_5000.jsonl ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"index":4,"step":1005000,"accuracy":69.4166666667,"f1_macro":69.3773463287,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"1","experiment_name":"mt5_small"}
2
+ {"index":29,"step":1505000,"accuracy":85.0833333333,"f1_macro":85.0675609446,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"1","experiment_name":"north_t5_base_NCC"}
3
+ {"index":54,"step":1605000,"accuracy":82.0,"f1_macro":81.9236273255,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"1","experiment_name":"north_t5_base_NCC_lm"}
4
+ {"index":79,"step":1005000,"accuracy":73.8333333333,"f1_macro":73.7913995726,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v1\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"1","experiment_name":"mt5_base"}
5
+ {"index":104,"step":1005000,"accuracy":68.4166666667,"f1_macro":68.3348430214,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"2","experiment_name":"mt5_small"}
6
+ {"index":129,"step":1505000,"accuracy":86.4166666667,"f1_macro":86.4007914795,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"2","experiment_name":"north_t5_base_NCC"}
7
+ {"index":154,"step":1605000,"accuracy":81.1666666667,"f1_macro":81.1284517815,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"2","experiment_name":"north_t5_base_NCC_lm"}
8
+ {"index":179,"step":1005000,"accuracy":73.3333333333,"f1_macro":73.2708911652,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v2\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"2","experiment_name":"mt5_base"}
9
+ {"index":204,"step":1005000,"accuracy":67.5,"f1_macro":67.499909722,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"3","experiment_name":"mt5_small"}
10
+ {"index":229,"step":1505000,"accuracy":86.4166666667,"f1_macro":86.4139400199,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"3","experiment_name":"north_t5_base_NCC"}
11
+ {"index":254,"step":1605000,"accuracy":82.0833333333,"f1_macro":82.0788405982,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"3","experiment_name":"north_t5_base_NCC_lm"}
12
+ {"index":279,"step":1005000,"accuracy":73.3333333333,"f1_macro":73.1824848104,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v3\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"3","experiment_name":"mt5_base"}
13
+ {"index":304,"step":1005000,"accuracy":67.75,"f1_macro":67.7401204119,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"4","experiment_name":"mt5_small"}
14
+ {"index":329,"step":1505000,"accuracy":83.75,"f1_macro":83.7474605407,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"4","experiment_name":"north_t5_base_NCC"}
15
+ {"index":354,"step":1605000,"accuracy":81.25,"f1_macro":81.235809581,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"4","experiment_name":"north_t5_base_NCC_lm"}
16
+ {"index":379,"step":1005000,"accuracy":71.5,"f1_macro":71.4616317494,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v4\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"4","experiment_name":"mt5_base"}
17
+ {"index":404,"step":1005000,"accuracy":70.0,"f1_macro":69.9899132764,"base_file_name":"finetuned\/ul2test\/eval_political_exp100_mt5_small_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"100","version":"5","experiment_name":"mt5_small"}
18
+ {"index":429,"step":1505000,"accuracy":86.0,"f1_macro":85.9968492911,"base_file_name":"finetuned\/ul2test\/eval_political_exp101_north_t5_base_NCC_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"101","version":"5","experiment_name":"north_t5_base_NCC"}
19
+ {"index":454,"step":1605000,"accuracy":82.6666666667,"f1_macro":82.6643070862,"base_file_name":"finetuned\/ul2test\/eval_political_exp102_north_t5_base_NCC_lm_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"102","version":"5","experiment_name":"north_t5_base_NCC_lm"}
20
+ {"index":479,"step":1005000,"accuracy":70.8333333333,"f1_macro":70.7975603448,"base_file_name":"finetuned\/ul2test\/eval_political_exp104_mt5_base_v5\/inference_eval\/parliament_max300_mt5-metrics.jsonl","pretraining_steps":0,"finetuning_steps":5000,"vocab":"max300_mt5","experiment":"104","version":"5","experiment_name":"mt5_base"}