pere committed on
Commit
3bfac5f
1 Parent(s): 5df95f8
stats/all.csv CHANGED
The diff for this file is too large to render. See raw diff
 
stats/all.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
stats/average_at_5000.csv CHANGED
@@ -52,7 +52,7 @@ experiment,experiment_name,pretraining_steps,accuracy,f1_macro,num_experiments
52
  17,t5-small-ul2-mt5voc-scratch,500000,81.45,81.39528145007205,5
53
  17,t5-small-ul2-mt5voc-scratch,1000000,81.7,81.67852155576905,5
54
  17,t5-small-ul2-mt5voc-scratch,1100000,81.56666666666668,81.52271320211511,5
55
- 18,t5-small-span-mt5voc-scratch,100000,82.29166666666667,82.2653488632385,4
56
  18,t5-small-span-mt5voc-scratch,200000,82.11666666666667,82.06098880578924,5
57
  18,t5-small-span-mt5voc-scratch,300000,82.53333333333333,82.49038612917455,5
58
  18,t5-small-span-mt5voc-scratch,400000,82.43333333333334,82.42718912983908,5
@@ -99,7 +99,7 @@ experiment,experiment_name,pretraining_steps,accuracy,f1_macro,num_experiments
99
  4,t5-base-span-scandvoc,1300000,83.43333333333332,83.41952324655281,5
100
  4,t5-base-span-scandvoc,1400000,76.83333333333334,73.48406842031721,5
101
  4,t5-base-span-scandvoc,1500000,75.76666666666667,72.41107299754478,5
102
- 5,t5-base-ul2-scandvoc-full,1184000,77.10416666666667,77.09637128744669,4
103
  5,t5-base-ul2-scandvoc-full,1284000,84.93333333333334,84.91954722609185,5
104
  5,t5-base-ul2-scandvoc-full,1384000,83.3,83.29187265250039,5
105
  5,t5-base-ul2-scandvoc-full,1484000,86.75,86.74973255081272,5
 
52
  17,t5-small-ul2-mt5voc-scratch,500000,81.45,81.39528145007205,5
53
  17,t5-small-ul2-mt5voc-scratch,1000000,81.7,81.67852155576905,5
54
  17,t5-small-ul2-mt5voc-scratch,1100000,81.56666666666668,81.52271320211511,5
55
+ 18,t5-small-span-mt5voc-scratch,100000,82.41666666666667,82.3927034098902,5
56
  18,t5-small-span-mt5voc-scratch,200000,82.11666666666667,82.06098880578924,5
57
  18,t5-small-span-mt5voc-scratch,300000,82.53333333333333,82.49038612917455,5
58
  18,t5-small-span-mt5voc-scratch,400000,82.43333333333334,82.42718912983908,5
 
99
  4,t5-base-span-scandvoc,1300000,83.43333333333332,83.41952324655281,5
100
  4,t5-base-span-scandvoc,1400000,76.83333333333334,73.48406842031721,5
101
  4,t5-base-span-scandvoc,1500000,75.76666666666667,72.41107299754478,5
102
+ 5,t5-base-ul2-scandvoc-full,1184000,77.13333333333334,77.12228601081839,5
103
  5,t5-base-ul2-scandvoc-full,1284000,84.93333333333334,84.91954722609185,5
104
  5,t5-base-ul2-scandvoc-full,1384000,83.3,83.29187265250039,5
105
  5,t5-base-ul2-scandvoc-full,1484000,86.75,86.74973255081272,5
stats/average_at_5000.jsonl CHANGED
@@ -51,7 +51,7 @@
51
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":500000,"accuracy":81.45,"f1_macro":81.3952814501,"num_experiments":5}
52
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":1000000,"accuracy":81.7,"f1_macro":81.6785215558,"num_experiments":5}
53
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":1100000,"accuracy":81.5666666667,"f1_macro":81.5227132021,"num_experiments":5}
54
- {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":100000,"accuracy":82.2916666667,"f1_macro":82.2653488632,"num_experiments":4}
55
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":200000,"accuracy":82.1166666667,"f1_macro":82.0609888058,"num_experiments":5}
56
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":300000,"accuracy":82.5333333333,"f1_macro":82.4903861292,"num_experiments":5}
57
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":400000,"accuracy":82.4333333333,"f1_macro":82.4271891298,"num_experiments":5}
@@ -98,7 +98,7 @@
98
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1300000,"accuracy":83.4333333333,"f1_macro":83.4195232466,"num_experiments":5}
99
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1400000,"accuracy":76.8333333333,"f1_macro":73.4840684203,"num_experiments":5}
100
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1500000,"accuracy":75.7666666667,"f1_macro":72.4110729975,"num_experiments":5}
101
- {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1184000,"accuracy":77.1041666667,"f1_macro":77.0963712874,"num_experiments":4}
102
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1284000,"accuracy":84.9333333333,"f1_macro":84.9195472261,"num_experiments":5}
103
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1384000,"accuracy":83.3,"f1_macro":83.2918726525,"num_experiments":5}
104
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1484000,"accuracy":86.75,"f1_macro":86.7497325508,"num_experiments":5}
 
51
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":500000,"accuracy":81.45,"f1_macro":81.3952814501,"num_experiments":5}
52
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":1000000,"accuracy":81.7,"f1_macro":81.6785215558,"num_experiments":5}
53
  {"experiment":"17","experiment_name":"t5-small-ul2-mt5voc-scratch","pretraining_steps":1100000,"accuracy":81.5666666667,"f1_macro":81.5227132021,"num_experiments":5}
54
+ {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":100000,"accuracy":82.4166666667,"f1_macro":82.3927034099,"num_experiments":5}
55
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":200000,"accuracy":82.1166666667,"f1_macro":82.0609888058,"num_experiments":5}
56
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":300000,"accuracy":82.5333333333,"f1_macro":82.4903861292,"num_experiments":5}
57
  {"experiment":"18","experiment_name":"t5-small-span-mt5voc-scratch","pretraining_steps":400000,"accuracy":82.4333333333,"f1_macro":82.4271891298,"num_experiments":5}
 
98
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1300000,"accuracy":83.4333333333,"f1_macro":83.4195232466,"num_experiments":5}
99
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1400000,"accuracy":76.8333333333,"f1_macro":73.4840684203,"num_experiments":5}
100
  {"experiment":"4","experiment_name":"t5-base-span-scandvoc","pretraining_steps":1500000,"accuracy":75.7666666667,"f1_macro":72.4110729975,"num_experiments":5}
101
+ {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1184000,"accuracy":77.1333333333,"f1_macro":77.1222860108,"num_experiments":5}
102
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1284000,"accuracy":84.9333333333,"f1_macro":84.9195472261,"num_experiments":5}
103
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1384000,"accuracy":83.3,"f1_macro":83.2918726525,"num_experiments":5}
104
  {"experiment":"5","experiment_name":"t5-base-ul2-scandvoc-full","pretraining_steps":1484000,"accuracy":86.75,"f1_macro":86.7497325508,"num_experiments":5}
stats/only_5000.csv CHANGED
The diff for this file is too large to render. See raw diff
 
stats/only_5000.jsonl CHANGED
The diff for this file is too large to render. See raw diff