anniew666 commited on
Commit
b27cd81
1 Parent(s): e481fc9

End of training

Browse files
Files changed (7) hide show
  1. all_results.json +36 -36
  2. cf.png +2 -2
  3. cf.txt +7 -7
  4. class_report.txt +10 -10
  5. eval_results.json +32 -32
  6. train_results.json +5 -5
  7. trainer_state.json +1235 -1194
all_results.json CHANGED
@@ -1,40 +1,40 @@
1
  {
2
- "epoch": 15.0,
3
- "eval_accuracy": 0.7630963972736124,
4
- "eval_b_acc": 0.6053830892588602,
5
- "eval_f1": 0.6276991641576467,
6
- "eval_f1_anger": 0.6168702073274639,
7
- "eval_f1_disgust": 0.43303571428571425,
8
- "eval_f1_fear": 0.638801261829653,
9
- "eval_f1_joy": 0.7379285799027169,
10
- "eval_f1_neutral": 0.8519039622384605,
11
- "eval_f1_sadness": 0.6683630195080577,
12
- "eval_f1_surprise": 0.44699140401146126,
13
- "eval_loss": 0.6577332019805908,
14
- "eval_micro_f1": 0.7630963972736124,
15
- "eval_prec": 0.6548174460459298,
16
- "eval_prec_anger": 0.6339754816112084,
17
- "eval_prec_disgust": 0.46411483253588515,
18
- "eval_prec_fear": 0.6923076923076923,
19
- "eval_prec_joy": 0.7441971763579803,
20
- "eval_prec_neutral": 0.8246199806695369,
21
- "eval_prec_sadness": 0.7163636363636363,
22
- "eval_prec_surprise": 0.50814332247557,
23
- "eval_recall": 0.6053830892588602,
24
- "eval_recall_anger": 0.6006637168141593,
25
- "eval_recall_disgust": 0.40585774058577406,
26
- "eval_recall_fear": 0.5929721815519766,
27
- "eval_recall_joy": 0.731764705882353,
28
- "eval_recall_neutral": 0.8810552009012392,
29
- "eval_recall_sadness": 0.6263910969793323,
30
- "eval_recall_surprise": 0.3989769820971867,
31
- "eval_runtime": 52.7414,
32
  "eval_samples": 20540,
33
- "eval_samples_per_second": 389.447,
34
- "eval_steps_per_second": 24.345,
35
- "train_loss": 0.6400373776102771,
36
- "train_runtime": 15988.8097,
37
  "train_samples": 187524,
38
- "train_samples_per_second": 175.927,
39
- "train_steps_per_second": 1.374
40
  }
 
1
  {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.7581304771178189,
4
+ "eval_b_acc": 0.6039152175326364,
5
+ "eval_f1": 0.6206372407316966,
6
+ "eval_f1_anger": 0.624553694040099,
7
+ "eval_f1_disgust": 0.4259259259259259,
8
+ "eval_f1_fear": 0.6247049567269867,
9
+ "eval_f1_joy": 0.7396948303347757,
10
+ "eval_f1_neutral": 0.8471082089552239,
11
+ "eval_f1_sadness": 0.6643598615916955,
12
+ "eval_f1_surprise": 0.41811320754716985,
13
+ "eval_loss": 0.6852018237113953,
14
+ "eval_micro_f1": 0.758130477117819,
15
+ "eval_prec": 0.6440153151637059,
16
+ "eval_prec_anger": 0.6202945990180033,
17
+ "eval_prec_disgust": 0.47668393782383417,
18
+ "eval_prec_fear": 0.6751700680272109,
19
+ "eval_prec_joy": 0.7166813768755517,
20
+ "eval_prec_neutral": 0.8417686318131257,
21
+ "eval_prec_sadness": 0.667379679144385,
22
+ "eval_prec_surprise": 0.5101289134438306,
23
+ "eval_recall": 0.6039152175326364,
24
+ "eval_recall_anger": 0.6288716814159292,
25
+ "eval_recall_disgust": 0.38493723849372385,
26
+ "eval_recall_fear": 0.5812591508052709,
27
+ "eval_recall_joy": 0.764235294117647,
28
+ "eval_recall_neutral": 0.8525159594442359,
29
+ "eval_recall_sadness": 0.6613672496025437,
30
+ "eval_recall_surprise": 0.35421994884910485,
31
+ "eval_runtime": 45.9859,
32
  "eval_samples": 20540,
33
+ "eval_samples_per_second": 446.659,
34
+ "eval_steps_per_second": 13.961,
35
+ "train_loss": 0.6315777759747294,
36
+ "train_runtime": 20512.0097,
37
  "train_samples": 187524,
38
+ "train_samples_per_second": 182.843,
39
+ "train_steps_per_second": 1.428
40
  }
cf.png CHANGED

Git LFS Details

  • SHA256: d01f228042b527113815349ac7f2f29ebd9b9f2364308980ba7dfaa7b79bc59a
  • Pointer size: 130 Bytes
  • Size of remote file: 57.6 kB

Git LFS Details

  • SHA256: 25206069fa666f7f10d0acb4e890e715b69537244b47562aa62533e9a8ff5a5c
  • Pointer size: 130 Bytes
  • Size of remote file: 58 kB
cf.txt CHANGED
@@ -1,7 +1,7 @@
1
- 6.316371681415928752e-01 4.756637168141592681e-02 2.101769911504424923e-02 5.475663716814159476e-02 1.637168141592920401e-01 6.084070796460176733e-02 2.046460176991150501e-02
2
- 2.133891213389121355e-01 4.037656903765690641e-01 5.020920502092050125e-02 7.740585774058576785e-02 8.995815899581589836e-02 1.485355648535564843e-01 1.673640167364016593e-02
3
- 6.588579795021962116e-02 2.781844802342606227e-02 5.885797950219618935e-01 6.295754026354319355e-02 1.390922401171303113e-01 6.588579795021962116e-02 4.978038067349926932e-02
4
- 2.117647058823529313e-02 4.000000000000000083e-03 6.823529411764705718e-03 7.630588235294117894e-01 1.642352941176470627e-01 2.447058823529411897e-02 1.623529411764705957e-02
5
- 3.276380022530980124e-02 4.224558768306421741e-03 4.318437852046564003e-03 7.904618850920014372e-02 8.428464138190011612e-01 2.384528726999624385e-02 1.295531355613969288e-02
6
- 5.140434552199257823e-02 3.391626921038685960e-02 2.172760996290408128e-02 6.306306306306305731e-02 1.510333863275039878e-01 6.618971913089559678e-01 1.695813460519342980e-02
7
- 4.859335038363171017e-02 1.918158567774936110e-02 3.452685421994884651e-02 2.046035805626598425e-01 2.442455242966752038e-01 6.649616368286445645e-02 3.823529411764705621e-01
 
1
+ 6.288716814159291957e-01 4.092920353982301002e-02 1.991150442477876079e-02 5.420353982300885054e-02 1.808628318584070693e-01 5.696902654867256471e-02 1.825221238938053159e-02
2
+ 2.092050209205020828e-01 3.849372384937238545e-01 5.020920502092050125e-02 6.903765690376569009e-02 1.087866108786610941e-01 1.589958158995815884e-01 1.882845188284518884e-02
3
+ 7.467057101024890398e-02 2.196193265007320705e-02 5.812591508052709077e-01 6.588579795021962116e-02 1.522693997071742356e-01 5.417276720351391073e-02 4.978038067349926932e-02
4
+ 2.235294117647058931e-02 3.058823529411764872e-03 5.411764705882352901e-03 7.642352941176470127e-01 1.689411764705882335e-01 2.423529411764705974e-02 1.176470588235294101e-02
5
+ 3.022906496432594889e-02 3.191888847164851654e-03 3.004130679684566263e-03 7.735636500187757780e-02 8.525159594442358602e-01 2.300037551633496088e-02 1.070221554637626818e-02
6
+ 4.928457869634340210e-02 3.126656067832538077e-02 2.437731849496555317e-02 6.412294647588764884e-02 1.558028616852146220e-01 6.613672496025436720e-01 1.377848436671966041e-02
7
+ 4.475703324808184141e-02 8.951406649616367936e-03 3.836317135549872220e-02 2.084398976982097251e-01 2.710997442455242989e-01 7.416879795396419395e-02 3.542199488491048487e-01
class_report.txt CHANGED
@@ -1,13 +1,13 @@
1
  precision recall f1-score support
2
 
3
- 0anger 0.61 0.63 0.62 1808
4
- 1disgust 0.44 0.40 0.42 478
5
- 2fear 0.66 0.59 0.62 683
6
- 3joy 0.71 0.76 0.74 4250
7
- 4neutral 0.85 0.84 0.85 10652
8
- 5sadness 0.66 0.66 0.66 1887
9
- 6surprise 0.48 0.38 0.43 782
10
 
11
- accuracy 0.75 20540
12
- macro avg 0.63 0.61 0.62 20540
13
- weighted avg 0.75 0.75 0.75 20540
 
1
  precision recall f1-score support
2
 
3
+ 0anger 0.62 0.63 0.62 1808
4
+ 1disgust 0.48 0.38 0.43 478
5
+ 2fear 0.68 0.58 0.62 683
6
+ 3joy 0.72 0.76 0.74 4250
7
+ 4neutral 0.84 0.85 0.85 10652
8
+ 5sadness 0.67 0.66 0.66 1887
9
+ 6surprise 0.51 0.35 0.42 782
10
 
11
+ accuracy 0.76 20540
12
+ macro avg 0.64 0.60 0.62 20540
13
+ weighted avg 0.75 0.76 0.75 20540
eval_results.json CHANGED
@@ -1,35 +1,35 @@
1
  {
2
- "epoch": 15.0,
3
- "eval_accuracy": 0.7630963972736124,
4
- "eval_b_acc": 0.6053830892588602,
5
- "eval_f1": 0.6276991641576467,
6
- "eval_f1_anger": 0.6168702073274639,
7
- "eval_f1_disgust": 0.43303571428571425,
8
- "eval_f1_fear": 0.638801261829653,
9
- "eval_f1_joy": 0.7379285799027169,
10
- "eval_f1_neutral": 0.8519039622384605,
11
- "eval_f1_sadness": 0.6683630195080577,
12
- "eval_f1_surprise": 0.44699140401146126,
13
- "eval_loss": 0.6577332019805908,
14
- "eval_micro_f1": 0.7630963972736124,
15
- "eval_prec": 0.6548174460459298,
16
- "eval_prec_anger": 0.6339754816112084,
17
- "eval_prec_disgust": 0.46411483253588515,
18
- "eval_prec_fear": 0.6923076923076923,
19
- "eval_prec_joy": 0.7441971763579803,
20
- "eval_prec_neutral": 0.8246199806695369,
21
- "eval_prec_sadness": 0.7163636363636363,
22
- "eval_prec_surprise": 0.50814332247557,
23
- "eval_recall": 0.6053830892588602,
24
- "eval_recall_anger": 0.6006637168141593,
25
- "eval_recall_disgust": 0.40585774058577406,
26
- "eval_recall_fear": 0.5929721815519766,
27
- "eval_recall_joy": 0.731764705882353,
28
- "eval_recall_neutral": 0.8810552009012392,
29
- "eval_recall_sadness": 0.6263910969793323,
30
- "eval_recall_surprise": 0.3989769820971867,
31
- "eval_runtime": 52.7414,
32
  "eval_samples": 20540,
33
- "eval_samples_per_second": 389.447,
34
- "eval_steps_per_second": 24.345
35
  }
 
1
  {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.7581304771178189,
4
+ "eval_b_acc": 0.6039152175326364,
5
+ "eval_f1": 0.6206372407316966,
6
+ "eval_f1_anger": 0.624553694040099,
7
+ "eval_f1_disgust": 0.4259259259259259,
8
+ "eval_f1_fear": 0.6247049567269867,
9
+ "eval_f1_joy": 0.7396948303347757,
10
+ "eval_f1_neutral": 0.8471082089552239,
11
+ "eval_f1_sadness": 0.6643598615916955,
12
+ "eval_f1_surprise": 0.41811320754716985,
13
+ "eval_loss": 0.6852018237113953,
14
+ "eval_micro_f1": 0.758130477117819,
15
+ "eval_prec": 0.6440153151637059,
16
+ "eval_prec_anger": 0.6202945990180033,
17
+ "eval_prec_disgust": 0.47668393782383417,
18
+ "eval_prec_fear": 0.6751700680272109,
19
+ "eval_prec_joy": 0.7166813768755517,
20
+ "eval_prec_neutral": 0.8417686318131257,
21
+ "eval_prec_sadness": 0.667379679144385,
22
+ "eval_prec_surprise": 0.5101289134438306,
23
+ "eval_recall": 0.6039152175326364,
24
+ "eval_recall_anger": 0.6288716814159292,
25
+ "eval_recall_disgust": 0.38493723849372385,
26
+ "eval_recall_fear": 0.5812591508052709,
27
+ "eval_recall_joy": 0.764235294117647,
28
+ "eval_recall_neutral": 0.8525159594442359,
29
+ "eval_recall_sadness": 0.6613672496025437,
30
+ "eval_recall_surprise": 0.35421994884910485,
31
+ "eval_runtime": 45.9859,
32
  "eval_samples": 20540,
33
+ "eval_samples_per_second": 446.659,
34
+ "eval_steps_per_second": 13.961
35
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 15.0,
3
- "train_loss": 0.6400373776102771,
4
- "train_runtime": 15988.8097,
5
  "train_samples": 187524,
6
- "train_samples_per_second": 175.927,
7
- "train_steps_per_second": 1.374
8
  }
 
1
  {
2
+ "epoch": 20.0,
3
+ "train_loss": 0.6315777759747294,
4
+ "train_runtime": 20512.0097,
5
  "train_samples": 187524,
6
+ "train_samples_per_second": 182.843,
7
+ "train_steps_per_second": 1.428
8
  }
trainer_state.json CHANGED
@@ -1,1284 +1,1325 @@
1
  {
2
- "best_metric": 0.6276991641576467,
3
- "best_model_checkpoint": ".exp/lora/lora-roberta-large-no-ed/checkpoint-17584",
4
- "epoch": 14.99744070977649,
5
- "global_step": 21975,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.15,
12
- "learning_rate": 0.00019836214740673338,
13
- "loss": 1.2151,
14
- "step": 220
15
  },
16
  {
17
- "epoch": 0.3,
18
- "learning_rate": 0.0003976342129208371,
19
- "loss": 0.8737,
20
- "step": 440
21
- },
22
- {
23
- "epoch": 0.45,
24
- "learning_rate": 0.0005969062784349408,
25
- "loss": 0.8228,
26
- "step": 660
27
  },
28
  {
29
  "epoch": 0.6,
30
- "learning_rate": 0.0007970882620564149,
31
- "loss": 0.8081,
32
- "step": 880
33
- },
34
- {
35
- "epoch": 0.75,
36
- "eval_accuracy": 0.7138266796494644,
37
- "eval_b_acc": 0.5642215512771782,
38
- "eval_f1": 0.5601190771157161,
39
- "eval_f1_anger": 0.515716568993074,
40
- "eval_f1_disgust": 0.3879907621247113,
41
- "eval_f1_fear": 0.5360230547550433,
42
- "eval_f1_joy": 0.6877726536208402,
43
- "eval_f1_neutral": 0.8344834105302958,
44
- "eval_f1_sadness": 0.5870011402508551,
45
- "eval_f1_surprise": 0.3718459495351925,
46
- "eval_loss": 0.790067732334137,
47
- "eval_micro_f1": 0.7138266796494644,
48
- "eval_prec": 0.5616517829432821,
49
- "eval_prec_anger": 0.49743062692702983,
50
- "eval_prec_disgust": 0.4329896907216495,
51
- "eval_prec_fear": 0.5276595744680851,
52
- "eval_prec_joy": 0.7312483434932414,
53
- "eval_prec_neutral": 0.8402817437654674,
54
- "eval_prec_sadness": 0.5152121697357886,
55
- "eval_prec_surprise": 0.3867403314917127,
56
- "eval_recall": 0.5642215512771782,
57
- "eval_recall_anger": 0.5353982300884956,
58
- "eval_recall_disgust": 0.3514644351464435,
59
- "eval_recall_fear": 0.5446559297218155,
60
- "eval_recall_joy": 0.6491764705882352,
61
- "eval_recall_neutral": 0.8287645512579798,
62
- "eval_recall_sadness": 0.6820349761526232,
63
- "eval_recall_surprise": 0.35805626598465473,
64
- "eval_runtime": 53.9044,
65
- "eval_samples_per_second": 381.045,
66
- "eval_steps_per_second": 23.82,
67
- "step": 1099
68
- },
69
- {
70
- "epoch": 0.75,
71
- "learning_rate": 0.000997270245677889,
72
- "loss": 0.7828,
73
- "step": 1100
74
- },
75
- {
76
- "epoch": 0.9,
77
- "learning_rate": 0.0009896052883694194,
78
- "loss": 0.7661,
79
- "step": 1320
80
- },
81
- {
82
- "epoch": 1.05,
83
- "learning_rate": 0.0009790668710480935,
84
- "loss": 0.7799,
85
- "step": 1540
86
  },
87
  {
88
  "epoch": 1.2,
89
- "learning_rate": 0.0009685284537267676,
90
- "loss": 0.757,
91
- "step": 1760
92
- },
93
- {
94
- "epoch": 1.35,
95
- "learning_rate": 0.0009579900364054417,
96
- "loss": 0.7543,
97
- "step": 1980
98
- },
99
- {
100
- "epoch": 1.5,
101
- "eval_accuracy": 0.7262901655306718,
102
- "eval_b_acc": 0.5714411859458394,
103
- "eval_f1": 0.573711944542916,
104
- "eval_f1_anger": 0.5241837968561063,
105
- "eval_f1_disgust": 0.44267198404785646,
106
- "eval_f1_fear": 0.546070460704607,
107
- "eval_f1_joy": 0.7150729335494327,
108
- "eval_f1_neutral": 0.8296947358472735,
109
- "eval_f1_sadness": 0.6172300981461288,
110
- "eval_f1_surprise": 0.3410596026490066,
111
- "eval_loss": 0.7482287883758545,
112
- "eval_micro_f1": 0.7262901655306718,
113
- "eval_prec": 0.5892369276637266,
114
- "eval_prec_anger": 0.578,
115
- "eval_prec_disgust": 0.4228571428571429,
116
- "eval_prec_fear": 0.5081967213114754,
117
- "eval_prec_joy": 0.6611388611388611,
118
- "eval_prec_neutral": 0.8352997145575642,
119
- "eval_prec_sadness": 0.6355979786636721,
120
- "eval_prec_surprise": 0.4835680751173709,
121
- "eval_recall": 0.5714411859458394,
122
- "eval_recall_anger": 0.4795353982300885,
123
- "eval_recall_disgust": 0.46443514644351463,
124
- "eval_recall_fear": 0.5900439238653001,
125
- "eval_recall_joy": 0.7785882352941177,
126
- "eval_recall_neutral": 0.8241644761547128,
127
- "eval_recall_sadness": 0.5998940116587176,
128
- "eval_recall_surprise": 0.26342710997442453,
129
- "eval_runtime": 52.5664,
130
- "eval_samples_per_second": 390.744,
131
- "eval_steps_per_second": 24.426,
132
- "step": 2198
133
- },
134
- {
135
- "epoch": 1.5,
136
- "learning_rate": 0.0009474516190841157,
137
- "loss": 0.7562,
138
- "step": 2200
139
- },
140
- {
141
- "epoch": 1.65,
142
- "learning_rate": 0.0009369132017627898,
143
- "loss": 0.7601,
144
- "step": 2420
145
  },
146
  {
147
- "epoch": 1.8,
148
- "learning_rate": 0.0009263747844414639,
149
- "loss": 0.7501,
150
- "step": 2640
151
  },
152
  {
153
- "epoch": 1.95,
154
- "learning_rate": 0.000915836367120138,
155
- "loss": 0.737,
156
- "step": 2860
157
- },
158
- {
159
- "epoch": 2.1,
160
- "learning_rate": 0.0009052979497988121,
161
- "loss": 0.7292,
162
- "step": 3080
163
- },
164
- {
165
- "epoch": 2.25,
166
- "eval_accuracy": 0.739240506329114,
167
- "eval_b_acc": 0.5728734605953718,
168
- "eval_f1": 0.5834227565376339,
169
- "eval_f1_anger": 0.5439560439560439,
170
- "eval_f1_disgust": 0.41185185185185186,
171
- "eval_f1_fear": 0.593798449612403,
172
- "eval_f1_joy": 0.721927599723311,
173
- "eval_f1_neutral": 0.8387907060195567,
174
- "eval_f1_sadness": 0.6231551328304362,
175
- "eval_f1_surprise": 0.35047951176983433,
176
- "eval_loss": 0.7176372408866882,
177
- "eval_micro_f1": 0.739240506329114,
178
- "eval_prec": 0.633689371773426,
179
- "eval_prec_anger": 0.6069482288828338,
180
- "eval_prec_disgust": 0.31880733944954126,
181
- "eval_prec_fear": 0.6309719934102141,
182
- "eval_prec_joy": 0.7077305605786618,
183
- "eval_prec_neutral": 0.8031266105480158,
184
- "eval_prec_sadness": 0.8175559380378657,
185
- "eval_prec_surprise": 0.5506849315068493,
186
- "eval_recall": 0.5728734605953718,
187
- "eval_recall_anger": 0.4928097345132743,
188
- "eval_recall_disgust": 0.5815899581589958,
189
- "eval_recall_fear": 0.5607613469985359,
190
- "eval_recall_joy": 0.7367058823529412,
191
- "eval_recall_neutral": 0.8777694329703342,
192
- "eval_recall_sadness": 0.5034446210916799,
193
- "eval_recall_surprise": 0.2570332480818414,
194
- "eval_runtime": 52.5539,
195
- "eval_samples_per_second": 390.837,
196
- "eval_steps_per_second": 24.432,
197
- "step": 3297
198
- },
199
- {
200
- "epoch": 2.25,
201
- "learning_rate": 0.0008948074343744013,
202
- "loss": 0.7375,
203
- "step": 3300
204
  },
205
  {
206
- "epoch": 2.4,
207
- "learning_rate": 0.0008842690170530752,
208
- "loss": 0.7199,
209
- "step": 3520
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
210
  },
211
  {
212
- "epoch": 2.55,
213
- "learning_rate": 0.0008737305997317494,
214
- "loss": 0.7064,
215
- "step": 3740
216
  },
217
  {
218
- "epoch": 2.7,
219
- "learning_rate": 0.0008631921824104235,
220
- "loss": 0.7063,
221
- "step": 3960
222
  },
223
  {
224
- "epoch": 2.85,
225
- "learning_rate": 0.0008526537650890975,
226
- "loss": 0.7138,
227
- "step": 4180
228
  },
229
  {
230
- "epoch": 3.0,
231
- "eval_accuracy": 0.7448393378773126,
232
- "eval_b_acc": 0.5918170569783451,
233
- "eval_f1": 0.6005073740718484,
234
- "eval_f1_anger": 0.583310230108123,
235
- "eval_f1_disgust": 0.4129301355578728,
236
- "eval_f1_fear": 0.582723279648609,
237
- "eval_f1_joy": 0.729650507328072,
238
- "eval_f1_neutral": 0.8403856955626287,
239
- "eval_f1_sadness": 0.6514983351831298,
240
- "eval_f1_surprise": 0.40305343511450376,
241
- "eval_loss": 0.688290536403656,
242
- "eval_micro_f1": 0.7448393378773126,
243
- "eval_prec": 0.6144786785060393,
244
- "eval_prec_anger": 0.584769316286826,
245
- "eval_prec_disgust": 0.41164241164241167,
246
- "eval_prec_fear": 0.582723279648609,
247
- "eval_prec_joy": 0.7004329004329004,
248
- "eval_prec_neutral": 0.8380321135175504,
249
- "eval_prec_sadness": 0.6837507280139778,
250
- "eval_prec_surprise": 0.5,
251
- "eval_recall": 0.5918170569783451,
252
- "eval_recall_anger": 0.581858407079646,
253
- "eval_recall_disgust": 0.41422594142259417,
254
- "eval_recall_fear": 0.582723279648609,
255
- "eval_recall_joy": 0.7614117647058823,
256
- "eval_recall_neutral": 0.842752534735261,
257
- "eval_recall_sadness": 0.6221515633280339,
258
- "eval_recall_surprise": 0.3375959079283887,
259
- "eval_runtime": 52.617,
260
- "eval_samples_per_second": 390.368,
261
- "eval_steps_per_second": 24.403,
262
- "step": 4396
263
  },
264
  {
265
  "epoch": 3.0,
266
- "learning_rate": 0.0008421632496646868,
267
  "loss": 0.7289,
268
- "step": 4400
269
  },
270
  {
271
- "epoch": 3.15,
272
- "learning_rate": 0.0008316248323433608,
273
- "loss": 0.6887,
274
- "step": 4620
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
275
  },
276
  {
277
- "epoch": 3.3,
278
- "learning_rate": 0.0008210864150220348,
279
- "loss": 0.6982,
280
- "step": 4840
281
  },
282
  {
283
- "epoch": 3.45,
284
- "learning_rate": 0.0008105479977007089,
285
- "loss": 0.701,
286
- "step": 5060
287
  },
288
  {
289
  "epoch": 3.6,
290
- "learning_rate": 0.0008000095803793831,
291
- "loss": 0.7046,
292
- "step": 5280
293
- },
294
- {
295
- "epoch": 3.75,
296
- "eval_accuracy": 0.7464946445959104,
297
- "eval_b_acc": 0.5788756560881936,
298
- "eval_f1": 0.5986191545663104,
299
- "eval_f1_anger": 0.5739130434782608,
300
- "eval_f1_disgust": 0.3984476067270375,
301
- "eval_f1_fear": 0.5746569814366425,
302
- "eval_f1_joy": 0.730888607885964,
303
- "eval_f1_neutral": 0.8425003475279181,
304
- "eval_f1_sadness": 0.6517333333333334,
305
- "eval_f1_surprise": 0.418194161575017,
306
- "eval_loss": 0.682627260684967,
307
- "eval_micro_f1": 0.7464946445959104,
308
- "eval_prec": 0.6275132039697725,
309
- "eval_prec_anger": 0.5822424587364826,
310
- "eval_prec_disgust": 0.5220338983050847,
311
- "eval_prec_fear": 0.6402877697841727,
312
- "eval_prec_joy": 0.7145425938413127,
313
- "eval_prec_neutral": 0.8318235886174399,
314
- "eval_prec_sadness": 0.6559312936124531,
315
- "eval_prec_surprise": 0.44573082489146165,
316
- "eval_recall": 0.5788756560881936,
317
- "eval_recall_anger": 0.5658185840707964,
318
- "eval_recall_disgust": 0.32217573221757323,
319
- "eval_recall_fear": 0.5212298682284041,
320
- "eval_recall_joy": 0.748,
321
- "eval_recall_neutral": 0.8534547502816372,
322
- "eval_recall_sadness": 0.6475887652358241,
323
- "eval_recall_surprise": 0.3938618925831202,
324
- "eval_runtime": 54.8263,
325
- "eval_samples_per_second": 374.638,
326
- "eval_steps_per_second": 23.419,
327
- "step": 5495
328
  },
329
  {
330
- "epoch": 3.75,
331
- "learning_rate": 0.0007894711630580571,
332
- "loss": 0.7145,
333
- "step": 5500
334
  },
335
  {
336
- "epoch": 3.9,
337
- "learning_rate": 0.0007789806476336463,
338
- "loss": 0.7056,
339
- "step": 5720
340
  },
341
  {
342
- "epoch": 4.05,
343
- "learning_rate": 0.0007684422303123204,
344
- "loss": 0.6911,
345
- "step": 5940
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
346
  },
347
  {
348
  "epoch": 4.2,
349
- "learning_rate": 0.0007579038129909944,
350
- "loss": 0.6777,
351
- "step": 6160
352
- },
353
- {
354
- "epoch": 4.35,
355
- "learning_rate": 0.0007473653956696685,
356
- "loss": 0.6767,
357
- "step": 6380
358
- },
359
- {
360
- "epoch": 4.5,
361
- "eval_accuracy": 0.7435735150925025,
362
- "eval_b_acc": 0.5648744699236212,
363
- "eval_f1": 0.592256565822076,
364
- "eval_f1_anger": 0.5643717196665637,
365
- "eval_f1_disgust": 0.36467236467236464,
366
- "eval_f1_fear": 0.6036536934074663,
367
- "eval_f1_joy": 0.7215847324556106,
368
- "eval_f1_neutral": 0.8374881666140739,
369
- "eval_f1_sadness": 0.6377816291161179,
370
- "eval_f1_surprise": 0.416243654822335,
371
- "eval_loss": 0.6971003413200378,
372
- "eval_micro_f1": 0.7435735150925025,
373
- "eval_prec": 0.6422939486456166,
374
- "eval_prec_anger": 0.6387141858839972,
375
- "eval_prec_disgust": 0.5714285714285714,
376
- "eval_prec_fear": 0.6597222222222222,
377
- "eval_prec_joy": 0.7413750310250683,
378
- "eval_prec_neutral": 0.80556760038158,
379
- "eval_prec_sadness": 0.5985130111524164,
380
- "eval_prec_surprise": 0.4807370184254606,
381
- "eval_recall": 0.5648744699236212,
382
- "eval_recall_anger": 0.5055309734513275,
383
- "eval_recall_disgust": 0.26778242677824265,
384
- "eval_recall_fear": 0.5563689604685212,
385
- "eval_recall_joy": 0.7028235294117647,
386
- "eval_recall_neutral": 0.8720428088621855,
387
- "eval_recall_sadness": 0.6825649178590355,
388
- "eval_recall_surprise": 0.3670076726342711,
389
- "eval_runtime": 52.3013,
390
- "eval_samples_per_second": 392.725,
391
- "eval_steps_per_second": 24.55,
392
- "step": 6594
393
- },
394
- {
395
- "epoch": 4.5,
396
- "learning_rate": 0.0007368269783483425,
397
- "loss": 0.6834,
398
- "step": 6600
399
- },
400
- {
401
- "epoch": 4.65,
402
- "learning_rate": 0.0007262885610270167,
403
- "loss": 0.6924,
404
- "step": 6820
405
- },
406
- {
407
- "epoch": 4.8,
408
- "learning_rate": 0.0007157501437056908,
409
- "loss": 0.6872,
410
- "step": 7040
411
- },
412
- {
413
- "epoch": 4.95,
414
- "learning_rate": 0.0007052117263843648,
415
- "loss": 0.6681,
416
- "step": 7260
417
- },
418
- {
419
- "epoch": 5.1,
420
- "learning_rate": 0.000694673309063039,
421
- "loss": 0.661,
422
- "step": 7480
423
- },
424
- {
425
- "epoch": 5.25,
426
- "eval_accuracy": 0.7383641674780915,
427
- "eval_b_acc": 0.602771097930762,
428
- "eval_f1": 0.6030709415406346,
429
- "eval_f1_anger": 0.5770609318996416,
430
- "eval_f1_disgust": 0.41814595660749504,
431
- "eval_f1_fear": 0.6160198183319571,
432
- "eval_f1_joy": 0.7286771805600258,
433
- "eval_f1_neutral": 0.8364084854464726,
434
- "eval_f1_sadness": 0.6574813998346651,
435
- "eval_f1_surprise": 0.38770281810418444,
436
- "eval_loss": 0.7123843431472778,
437
- "eval_micro_f1": 0.7383641674780915,
438
- "eval_prec": 0.6294789669741513,
439
- "eval_prec_anger": 0.48493975903614456,
440
- "eval_prec_disgust": 0.39552238805970147,
441
- "eval_prec_fear": 0.7064393939393939,
442
- "eval_prec_joy": 0.6696903963715244,
443
- "eval_prec_neutral": 0.88136826783115,
444
- "eval_prec_sadness": 0.6848450057405281,
445
- "eval_prec_surprise": 0.583547557840617,
446
- "eval_recall": 0.602771097930762,
447
- "eval_recall_anger": 0.7123893805309734,
448
- "eval_recall_disgust": 0.4435146443514644,
449
- "eval_recall_fear": 0.5461200585651538,
450
- "eval_recall_joy": 0.7990588235294117,
451
- "eval_recall_neutral": 0.7958129928651896,
452
- "eval_recall_sadness": 0.6322204557498675,
453
- "eval_recall_surprise": 0.29028132992327366,
454
- "eval_runtime": 52.258,
455
- "eval_samples_per_second": 393.05,
456
- "eval_steps_per_second": 24.57,
457
- "step": 7693
458
- },
459
- {
460
- "epoch": 5.26,
461
- "learning_rate": 0.000684134891741713,
462
- "loss": 0.6623,
463
- "step": 7700
464
  },
465
  {
466
- "epoch": 5.41,
467
- "learning_rate": 0.000673596474420387,
468
- "loss": 0.6663,
469
- "step": 7920
470
  },
471
  {
472
- "epoch": 5.56,
473
- "learning_rate": 0.0006630580570990611,
474
- "loss": 0.6669,
475
- "step": 8140
476
  },
477
  {
478
- "epoch": 5.71,
479
- "learning_rate": 0.0006525196397777352,
480
- "loss": 0.6691,
481
- "step": 8360
482
- },
483
- {
484
- "epoch": 5.86,
485
- "learning_rate": 0.0006419812224564093,
486
- "loss": 0.6652,
487
- "step": 8580
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
488
  },
489
  {
490
  "epoch": 6.0,
491
- "eval_accuracy": 0.752921129503408,
492
- "eval_b_acc": 0.594191766213012,
493
- "eval_f1": 0.6135563471911549,
494
- "eval_f1_anger": 0.5377977217811529,
495
- "eval_f1_disgust": 0.4477933261571583,
496
- "eval_f1_fear": 0.6142208774583964,
497
- "eval_f1_joy": 0.7345635202271116,
498
- "eval_f1_neutral": 0.8443846671149968,
499
- "eval_f1_sadness": 0.659697386519945,
500
- "eval_f1_surprise": 0.4564369310793238,
501
- "eval_loss": 0.670600414276123,
502
- "eval_micro_f1": 0.752921129503408,
503
- "eval_prec": 0.6441161632494222,
504
- "eval_prec_anger": 0.7153351698806244,
505
- "eval_prec_disgust": 0.4611973392461197,
506
- "eval_prec_fear": 0.6353677621283255,
507
- "eval_prec_joy": 0.7385823025689819,
508
- "eval_prec_neutral": 0.8081180811808119,
509
- "eval_prec_sadness": 0.6859267734553776,
510
- "eval_prec_surprise": 0.4642857142857143,
511
- "eval_recall": 0.594191766213012,
512
- "eval_recall_anger": 0.43086283185840707,
513
- "eval_recall_disgust": 0.4351464435146444,
514
- "eval_recall_fear": 0.5944363103953147,
515
- "eval_recall_joy": 0.7305882352941176,
516
- "eval_recall_neutral": 0.8840593315809238,
517
- "eval_recall_sadness": 0.6354001059883413,
518
- "eval_recall_surprise": 0.44884910485933505,
519
- "eval_runtime": 52.6277,
520
- "eval_samples_per_second": 390.289,
521
- "eval_steps_per_second": 24.398,
522
- "step": 8792
523
- },
524
- {
525
- "epoch": 6.01,
526
- "learning_rate": 0.0006314428051350833,
527
- "loss": 0.66,
528
- "step": 8800
529
- },
530
- {
531
- "epoch": 6.16,
532
- "learning_rate": 0.0006209043878137575,
533
- "loss": 0.6414,
534
- "step": 9020
535
- },
536
- {
537
- "epoch": 6.31,
538
- "learning_rate": 0.0006103659704924315,
539
- "loss": 0.6445,
540
- "step": 9240
541
- },
542
- {
543
- "epoch": 6.46,
544
- "learning_rate": 0.0005998275531711056,
545
- "loss": 0.6405,
546
- "step": 9460
547
- },
548
- {
549
- "epoch": 6.61,
550
- "learning_rate": 0.0005892891358497796,
551
- "loss": 0.6532,
552
- "step": 9680
553
- },
554
- {
555
- "epoch": 6.75,
556
- "eval_accuracy": 0.7581791626095423,
557
- "eval_b_acc": 0.5852602000181494,
558
- "eval_f1": 0.614564401804941,
559
- "eval_f1_anger": 0.5887445887445888,
560
- "eval_f1_disgust": 0.4246079613992763,
561
- "eval_f1_fear": 0.6189300411522632,
562
- "eval_f1_joy": 0.7366662689416538,
563
- "eval_f1_neutral": 0.8483534354248544,
564
- "eval_f1_sadness": 0.6636794939377966,
565
- "eval_f1_surprise": 0.42096902303415407,
566
- "eval_loss": 0.6566693782806396,
567
- "eval_micro_f1": 0.7581791626095423,
568
- "eval_prec": 0.6577687706916829,
569
- "eval_prec_anger": 0.6155703077851539,
570
- "eval_prec_disgust": 0.5014245014245015,
571
- "eval_prec_fear": 0.706766917293233,
572
- "eval_prec_joy": 0.7472766884531591,
573
- "eval_prec_neutral": 0.8175881584675664,
574
- "eval_prec_sadness": 0.6601992658626115,
575
- "eval_prec_surprise": 0.5555555555555556,
576
- "eval_recall": 0.5852602000181494,
577
- "eval_recall_anger": 0.5641592920353983,
578
- "eval_recall_disgust": 0.3682008368200837,
579
- "eval_recall_fear": 0.5505124450951684,
580
- "eval_recall_joy": 0.7263529411764705,
581
- "eval_recall_neutral": 0.88152459631994,
582
- "eval_recall_sadness": 0.6671966083730789,
583
- "eval_recall_surprise": 0.3388746803069054,
584
- "eval_runtime": 52.2302,
585
- "eval_samples_per_second": 393.259,
586
- "eval_steps_per_second": 24.583,
587
- "step": 9891
588
- },
589
- {
590
- "epoch": 6.76,
591
- "learning_rate": 0.0005787507185284537,
592
- "loss": 0.6566,
593
- "step": 9900
594
- },
595
- {
596
- "epoch": 6.91,
597
- "learning_rate": 0.0005682602031040429,
598
- "loss": 0.6528,
599
- "step": 10120
600
- },
601
- {
602
- "epoch": 7.06,
603
- "learning_rate": 0.000557769687679632,
604
- "loss": 0.6419,
605
- "step": 10340
606
- },
607
- {
608
- "epoch": 7.21,
609
- "learning_rate": 0.0005472312703583062,
610
- "loss": 0.6305,
611
- "step": 10560
612
- },
613
- {
614
- "epoch": 7.36,
615
- "learning_rate": 0.0005366928530369802,
616
- "loss": 0.6314,
617
- "step": 10780
618
- },
619
- {
620
- "epoch": 7.5,
621
- "eval_accuracy": 0.7554527750730282,
622
- "eval_b_acc": 0.5864396115457234,
623
- "eval_f1": 0.6141846408191719,
624
- "eval_f1_anger": 0.6100183582480986,
625
- "eval_f1_disgust": 0.4005235602094241,
626
- "eval_f1_fear": 0.6080586080586081,
627
- "eval_f1_joy": 0.7392614080107107,
628
- "eval_f1_neutral": 0.8438656485688855,
629
- "eval_f1_sadness": 0.6687747035573123,
630
- "eval_f1_surprise": 0.4287901990811639,
631
- "eval_loss": 0.6726419925689697,
632
- "eval_micro_f1": 0.7554527750730282,
633
- "eval_prec": 0.6673306947742298,
634
- "eval_prec_anger": 0.5800498753117207,
635
- "eval_prec_disgust": 0.534965034965035,
636
- "eval_prec_fear": 0.8117359413202934,
637
- "eval_prec_joy": 0.7029492892000849,
638
- "eval_prec_neutral": 0.8421692379616643,
639
- "eval_prec_sadness": 0.6650943396226415,
640
- "eval_prec_surprise": 0.5343511450381679,
641
- "eval_recall": 0.5864396115457234,
642
- "eval_recall_anger": 0.6432522123893806,
643
- "eval_recall_disgust": 0.3200836820083682,
644
- "eval_recall_fear": 0.486090775988287,
645
- "eval_recall_joy": 0.7795294117647059,
646
- "eval_recall_neutral": 0.8455689072474653,
647
- "eval_recall_sadness": 0.6724960254372019,
648
- "eval_recall_surprise": 0.35805626598465473,
649
- "eval_runtime": 52.4759,
650
- "eval_samples_per_second": 391.418,
651
- "eval_steps_per_second": 24.468,
652
- "step": 10990
653
- },
654
- {
655
- "epoch": 7.51,
656
- "learning_rate": 0.0005261544357156543,
657
- "loss": 0.6297,
658
- "step": 11000
659
- },
660
- {
661
- "epoch": 7.66,
662
- "learning_rate": 0.0005156160183943285,
663
- "loss": 0.6373,
664
- "step": 11220
665
- },
666
- {
667
- "epoch": 7.81,
668
- "learning_rate": 0.0005050776010730025,
669
- "loss": 0.6278,
670
- "step": 11440
671
- },
672
- {
673
- "epoch": 7.96,
674
- "learning_rate": 0.0004945391837516765,
675
- "loss": 0.6321,
676
- "step": 11660
677
- },
678
- {
679
- "epoch": 8.11,
680
- "learning_rate": 0.0004840007664303506,
681
- "loss": 0.6045,
682
- "step": 11880
683
- },
684
- {
685
- "epoch": 8.25,
686
- "eval_accuracy": 0.7577896786757546,
687
- "eval_b_acc": 0.6005624120936303,
688
- "eval_f1": 0.6238197827942396,
689
- "eval_f1_anger": 0.6038186157517901,
690
- "eval_f1_disgust": 0.4337078651685393,
691
- "eval_f1_fear": 0.6333907056798622,
692
- "eval_f1_joy": 0.7377106333527018,
693
- "eval_f1_neutral": 0.8465511724642318,
694
- "eval_f1_sadness": 0.6661166116611661,
695
- "eval_f1_surprise": 0.4454428754813864,
696
- "eval_loss": 0.6667613387107849,
697
- "eval_micro_f1": 0.7577896786757546,
698
- "eval_prec": 0.6550680878375978,
699
- "eval_prec_anger": 0.655440414507772,
700
- "eval_prec_disgust": 0.4684466019417476,
701
- "eval_prec_fear": 0.7682672233820459,
702
- "eval_prec_joy": 0.7288174512055109,
703
- "eval_prec_neutral": 0.8249443207126949,
704
- "eval_prec_sadness": 0.6923956546598056,
705
- "eval_prec_surprise": 0.44716494845360827,
706
- "eval_recall": 0.6005624120936303,
707
- "eval_recall_anger": 0.5597345132743363,
708
- "eval_recall_disgust": 0.40376569037656906,
709
- "eval_recall_fear": 0.5387994143484627,
710
- "eval_recall_joy": 0.7468235294117647,
711
- "eval_recall_neutral": 0.8693203154337213,
712
- "eval_recall_sadness": 0.6417594064652888,
713
- "eval_recall_surprise": 0.4437340153452685,
714
- "eval_runtime": 54.5559,
715
- "eval_samples_per_second": 376.494,
716
- "eval_steps_per_second": 23.535,
717
- "step": 12089
718
  },
719
  {
720
- "epoch": 8.26,
721
- "learning_rate": 0.00047346234910902474,
722
- "loss": 0.6078,
723
- "step": 12100
724
- },
725
- {
726
- "epoch": 8.41,
727
- "learning_rate": 0.0004629239317876988,
728
- "loss": 0.6091,
729
- "step": 12320
730
- },
731
- {
732
- "epoch": 8.56,
733
- "learning_rate": 0.0004523855144663729,
734
- "loss": 0.6127,
735
- "step": 12540
736
- },
737
- {
738
- "epoch": 8.71,
739
- "learning_rate": 0.00044184709714504693,
740
- "loss": 0.6243,
741
- "step": 12760
742
- },
743
- {
744
- "epoch": 8.86,
745
- "learning_rate": 0.000431308679823721,
746
- "loss": 0.6182,
747
- "step": 12980
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
748
  },
749
  {
750
  "epoch": 9.0,
751
- "eval_accuracy": 0.7570593962999026,
752
- "eval_b_acc": 0.6044499151869599,
753
- "eval_f1": 0.6204901474344295,
754
- "eval_f1_anger": 0.6087460179554011,
755
- "eval_f1_disgust": 0.44725738396624476,
756
- "eval_f1_fear": 0.6212361331220285,
757
- "eval_f1_joy": 0.7376712328767122,
758
- "eval_f1_neutral": 0.8463038632986627,
759
- "eval_f1_sadness": 0.6678737713398861,
760
- "eval_f1_surprise": 0.41434262948207173,
761
- "eval_loss": 0.6659196615219116,
762
- "eval_micro_f1": 0.7570593962999026,
763
- "eval_prec": 0.6461033688057751,
764
- "eval_prec_anger": 0.6389057750759879,
765
- "eval_prec_disgust": 0.451063829787234,
766
- "eval_prec_fear": 0.6770293609671848,
767
- "eval_prec_joy": 0.7164079822616408,
768
- "eval_prec_neutral": 0.8372840867328188,
769
- "eval_prec_sadness": 0.6523496715512885,
770
- "eval_prec_surprise": 0.5496828752642706,
771
- "eval_recall": 0.6044499151869599,
772
- "eval_recall_anger": 0.5813053097345132,
773
- "eval_recall_disgust": 0.4435146443514644,
774
- "eval_recall_fear": 0.5739385065885798,
775
- "eval_recall_joy": 0.760235294117647,
776
- "eval_recall_neutral": 0.8555200901239204,
777
- "eval_recall_sadness": 0.6841547429782724,
778
- "eval_recall_surprise": 0.33248081841432225,
779
- "eval_runtime": 53.1364,
780
- "eval_samples_per_second": 386.552,
781
- "eval_steps_per_second": 24.164,
782
- "step": 13188
783
- },
784
- {
785
- "epoch": 9.01,
786
- "learning_rate": 0.0004207702625023951,
787
- "loss": 0.6299,
788
- "step": 13200
789
- },
790
- {
791
- "epoch": 9.16,
792
- "learning_rate": 0.00041023184518106917,
793
- "loss": 0.5991,
794
- "step": 13420
795
- },
796
- {
797
- "epoch": 9.31,
798
- "learning_rate": 0.00039969342785974325,
799
- "loss": 0.5962,
800
- "step": 13640
801
- },
802
- {
803
- "epoch": 9.46,
804
- "learning_rate": 0.00038915501053841733,
805
- "loss": 0.6014,
806
- "step": 13860
807
  },
808
  {
809
- "epoch": 9.61,
810
- "learning_rate": 0.0003786165932170914,
811
- "loss": 0.5927,
812
- "step": 14080
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
813
  },
814
  {
815
- "epoch": 9.75,
816
- "eval_accuracy": 0.7466407010710808,
817
- "eval_b_acc": 0.5639997332284856,
818
- "eval_f1": 0.595181302839129,
819
- "eval_f1_anger": 0.5956719817767653,
820
- "eval_f1_disgust": 0.3489736070381232,
821
- "eval_f1_fear": 0.6333059885151764,
822
- "eval_f1_joy": 0.7182098034572578,
823
- "eval_f1_neutral": 0.8372471833853672,
824
- "eval_f1_sadness": 0.6523649521840268,
825
- "eval_f1_surprise": 0.38049560351718625,
826
- "eval_loss": 0.7097288966178894,
827
- "eval_micro_f1": 0.7466407010710808,
828
- "eval_prec": 0.6560660561913124,
829
- "eval_prec_anger": 0.613849765258216,
830
- "eval_prec_disgust": 0.5833333333333334,
831
- "eval_prec_fear": 0.7201492537313433,
832
- "eval_prec_joy": 0.7228312678741659,
833
- "eval_prec_neutral": 0.8081055113983754,
834
- "eval_prec_sadness": 0.6367305751765893,
835
- "eval_prec_surprise": 0.5074626865671642,
836
- "eval_recall": 0.5639997332284856,
837
- "eval_recall_anger": 0.5785398230088495,
838
- "eval_recall_disgust": 0.2489539748953975,
839
- "eval_recall_fear": 0.5651537335285505,
840
- "eval_recall_joy": 0.7136470588235294,
841
- "eval_recall_neutral": 0.8685692827638002,
842
- "eval_recall_sadness": 0.6687864334923158,
843
- "eval_recall_surprise": 0.30434782608695654,
844
- "eval_runtime": 53.7235,
845
- "eval_samples_per_second": 382.328,
846
- "eval_steps_per_second": 23.9,
847
- "step": 14287
848
- },
849
- {
850
- "epoch": 9.76,
851
- "learning_rate": 0.0003680781758957655,
852
- "loss": 0.5977,
853
- "step": 14300
854
- },
855
- {
856
- "epoch": 9.91,
857
- "learning_rate": 0.00035753975857443957,
858
- "loss": 0.6181,
859
- "step": 14520
860
- },
861
- {
862
- "epoch": 10.06,
863
- "learning_rate": 0.00034704924315002875,
864
- "loss": 0.595,
865
- "step": 14740
866
- },
867
- {
868
- "epoch": 10.21,
869
- "learning_rate": 0.00033651082582870283,
870
- "loss": 0.5668,
871
- "step": 14960
872
- },
873
- {
874
- "epoch": 10.36,
875
- "learning_rate": 0.0003259724085073769,
876
- "loss": 0.5736,
877
- "step": 15180
878
- },
879
- {
880
- "epoch": 10.5,
881
- "eval_accuracy": 0.758666017526777,
882
- "eval_b_acc": 0.6092103490403898,
883
- "eval_f1": 0.6224896550246998,
884
- "eval_f1_anger": 0.6192840344917692,
885
- "eval_f1_disgust": 0.42822966507177035,
886
- "eval_f1_fear": 0.6338028169014085,
887
- "eval_f1_joy": 0.742619926199262,
888
- "eval_f1_neutral": 0.8472516603080401,
889
- "eval_f1_sadness": 0.672,
890
- "eval_f1_surprise": 0.4142394822006473,
891
- "eval_loss": 0.6662837862968445,
892
- "eval_micro_f1": 0.758666017526777,
893
- "eval_prec": 0.6494125401879046,
894
- "eval_prec_anger": 0.586924219910847,
895
- "eval_prec_disgust": 0.5,
896
- "eval_prec_fear": 0.680672268907563,
897
- "eval_prec_joy": 0.7281772953414745,
898
- "eval_prec_neutral": 0.8501748747518669,
899
- "eval_prec_sadness": 0.6360624704212021,
900
- "eval_prec_surprise": 0.5638766519823789,
901
- "eval_recall": 0.6092103490403898,
902
- "eval_recall_anger": 0.6554203539823009,
903
- "eval_recall_disgust": 0.37447698744769875,
904
- "eval_recall_fear": 0.5929721815519766,
905
- "eval_recall_joy": 0.7576470588235295,
906
- "eval_recall_neutral": 0.8443484791588434,
907
- "eval_recall_sadness": 0.712241653418124,
908
- "eval_recall_surprise": 0.3273657289002558,
909
- "eval_runtime": 52.4006,
910
- "eval_samples_per_second": 391.98,
911
- "eval_steps_per_second": 24.504,
912
- "step": 15386
913
- },
914
- {
915
- "epoch": 10.51,
916
- "learning_rate": 0.000315433991186051,
917
- "loss": 0.5779,
918
- "step": 15400
919
- },
920
- {
921
- "epoch": 10.66,
922
- "learning_rate": 0.00030489557386472507,
923
- "loss": 0.5816,
924
- "step": 15620
925
- },
926
- {
927
- "epoch": 10.81,
928
- "learning_rate": 0.0002943571565433991,
929
- "loss": 0.5866,
930
- "step": 15840
931
- },
932
- {
933
- "epoch": 10.96,
934
- "learning_rate": 0.0002838187392220732,
935
- "loss": 0.5797,
936
- "step": 16060
937
- },
938
- {
939
- "epoch": 11.11,
940
- "learning_rate": 0.00027328032190074725,
941
- "loss": 0.5687,
942
- "step": 16280
943
- },
944
- {
945
- "epoch": 11.25,
946
- "eval_accuracy": 0.7633398247322298,
947
- "eval_b_acc": 0.6147514191038456,
948
- "eval_f1": 0.6337188907871468,
949
- "eval_f1_anger": 0.6268229911352589,
950
- "eval_f1_disgust": 0.470076169749728,
951
- "eval_f1_fear": 0.6422018348623854,
952
- "eval_f1_joy": 0.7406107406107406,
953
- "eval_f1_neutral": 0.8523923886938851,
954
- "eval_f1_sadness": 0.6596455175956846,
955
- "eval_f1_surprise": 0.4442825928623452,
956
- "eval_loss": 0.6598661541938782,
957
- "eval_micro_f1": 0.7633398247322298,
958
- "eval_prec": 0.6594926170544204,
959
- "eval_prec_anger": 0.6489046773238603,
960
- "eval_prec_disgust": 0.4897959183673469,
961
- "eval_prec_fear": 0.7461240310077519,
962
- "eval_prec_joy": 0.7365603909704445,
963
- "eval_prec_neutral": 0.8389090909090909,
964
- "eval_prec_sadness": 0.6400797607178464,
965
- "eval_prec_surprise": 0.5160744500846024,
966
- "eval_recall": 0.6147514191038456,
967
- "eval_recall_anger": 0.6061946902654868,
968
- "eval_recall_disgust": 0.45188284518828453,
969
- "eval_recall_fear": 0.5636896046852123,
970
- "eval_recall_joy": 0.7447058823529412,
971
- "eval_recall_neutral": 0.8663161847540368,
972
- "eval_recall_sadness": 0.6804451510333863,
973
- "eval_recall_surprise": 0.3900255754475703,
974
- "eval_runtime": 54.1532,
975
- "eval_samples_per_second": 379.294,
976
- "eval_steps_per_second": 23.711,
977
- "step": 16485
978
- },
979
- {
980
- "epoch": 11.26,
981
- "learning_rate": 0.0002627419045794214,
982
- "loss": 0.5575,
983
- "step": 16500
984
- },
985
- {
986
- "epoch": 11.41,
987
- "learning_rate": 0.00025220348725809547,
988
- "loss": 0.5672,
989
- "step": 16720
990
- },
991
- {
992
- "epoch": 11.56,
993
- "learning_rate": 0.00024166506993676952,
994
- "loss": 0.5582,
995
- "step": 16940
996
- },
997
- {
998
- "epoch": 11.71,
999
- "learning_rate": 0.00023112665261544357,
1000
- "loss": 0.5607,
1001
- "step": 17160
1002
- },
1003
- {
1004
- "epoch": 11.86,
1005
- "learning_rate": 0.00022058823529411765,
1006
- "loss": 0.5652,
1007
- "step": 17380
1008
  },
1009
  {
1010
  "epoch": 12.0,
1011
- "eval_accuracy": 0.7630963972736124,
1012
- "eval_b_acc": 0.6053830892588602,
1013
- "eval_f1": 0.6276991641576467,
1014
- "eval_f1_anger": 0.6168702073274639,
1015
- "eval_f1_disgust": 0.43303571428571425,
1016
- "eval_f1_fear": 0.638801261829653,
1017
- "eval_f1_joy": 0.7379285799027169,
1018
- "eval_f1_neutral": 0.8519039622384605,
1019
- "eval_f1_sadness": 0.6683630195080577,
1020
- "eval_f1_surprise": 0.44699140401146126,
1021
- "eval_loss": 0.6577332019805908,
1022
- "eval_micro_f1": 0.7630963972736124,
1023
- "eval_prec": 0.6548174460459298,
1024
- "eval_prec_anger": 0.6339754816112084,
1025
- "eval_prec_disgust": 0.46411483253588515,
1026
- "eval_prec_fear": 0.6923076923076923,
1027
- "eval_prec_joy": 0.7441971763579803,
1028
- "eval_prec_neutral": 0.8246199806695369,
1029
- "eval_prec_sadness": 0.7163636363636363,
1030
- "eval_prec_surprise": 0.50814332247557,
1031
- "eval_recall": 0.6053830892588602,
1032
- "eval_recall_anger": 0.6006637168141593,
1033
- "eval_recall_disgust": 0.40585774058577406,
1034
- "eval_recall_fear": 0.5929721815519766,
1035
- "eval_recall_joy": 0.731764705882353,
1036
- "eval_recall_neutral": 0.8810552009012392,
1037
- "eval_recall_sadness": 0.6263910969793323,
1038
- "eval_recall_surprise": 0.3989769820971867,
1039
- "eval_runtime": 53.0543,
1040
- "eval_samples_per_second": 387.151,
1041
- "eval_steps_per_second": 24.202,
1042
- "step": 17584
1043
- },
1044
- {
1045
- "epoch": 12.01,
1046
- "learning_rate": 0.00021004981797279173,
1047
- "loss": 0.5559,
1048
- "step": 17600
1049
- },
1050
- {
1051
- "epoch": 12.16,
1052
- "learning_rate": 0.00019951140065146582,
1053
- "loss": 0.5439,
1054
- "step": 17820
1055
- },
1056
- {
1057
- "epoch": 12.31,
1058
- "learning_rate": 0.00018897298333013987,
1059
- "loss": 0.5438,
1060
- "step": 18040
1061
- },
1062
- {
1063
- "epoch": 12.46,
1064
- "learning_rate": 0.00017843456600881395,
1065
- "loss": 0.543,
1066
- "step": 18260
1067
- },
1068
- {
1069
- "epoch": 12.61,
1070
- "learning_rate": 0.00016789614868748803,
1071
- "loss": 0.5377,
1072
- "step": 18480
1073
- },
1074
- {
1075
- "epoch": 12.75,
1076
- "eval_accuracy": 0.7619766309639727,
1077
- "eval_b_acc": 0.6124179118880813,
1078
- "eval_f1": 0.6250179854378021,
1079
- "eval_f1_anger": 0.6205983584855705,
1080
- "eval_f1_disgust": 0.41743119266055045,
1081
- "eval_f1_fear": 0.6180981595092024,
1082
- "eval_f1_joy": 0.7463065558633425,
1083
- "eval_f1_neutral": 0.8512547315295107,
1084
- "eval_f1_sadness": 0.6756976429151992,
1085
- "eval_f1_surprise": 0.44573925710123824,
1086
- "eval_loss": 0.6680665612220764,
1087
- "eval_micro_f1": 0.7619766309639727,
1088
- "eval_prec": 0.6421501390714648,
1089
- "eval_prec_anger": 0.595226003047232,
1090
- "eval_prec_disgust": 0.4619289340101523,
1091
- "eval_prec_fear": 0.6489533011272142,
1092
- "eval_prec_joy": 0.732442229270503,
1093
- "eval_prec_neutral": 0.8474923234390993,
1094
- "eval_prec_sadness": 0.6912416851441242,
1095
- "eval_prec_surprise": 0.5177664974619289,
1096
- "eval_recall": 0.6124179118880813,
1097
- "eval_recall_anger": 0.6482300884955752,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1098
  "eval_recall_disgust": 0.3807531380753138,
1099
- "eval_recall_fear": 0.5900439238653001,
1100
- "eval_recall_joy": 0.7607058823529412,
1101
- "eval_recall_neutral": 0.8550506947052197,
1102
- "eval_recall_sadness": 0.6608373078961314,
1103
- "eval_recall_surprise": 0.391304347826087,
1104
- "eval_runtime": 53.2844,
1105
- "eval_samples_per_second": 385.479,
1106
- "eval_steps_per_second": 24.097,
1107
- "step": 18683
1108
  },
1109
  {
1110
- "epoch": 12.76,
1111
- "learning_rate": 0.0001573577313661621,
1112
- "loss": 0.5457,
1113
- "step": 18700
1114
  },
1115
  {
1116
- "epoch": 12.91,
1117
- "learning_rate": 0.00014681931404483616,
1118
- "loss": 0.5445,
1119
- "step": 18920
1120
  },
1121
  {
1122
- "epoch": 13.06,
1123
- "learning_rate": 0.0001363287986204254,
1124
- "loss": 0.5323,
1125
- "step": 19140
1126
  },
1127
  {
1128
- "epoch": 13.21,
1129
- "learning_rate": 0.00012579038129909945,
1130
- "loss": 0.5214,
1131
- "step": 19360
1132
  },
1133
  {
1134
- "epoch": 13.36,
1135
- "learning_rate": 0.00011525196397777351,
1136
- "loss": 0.5312,
1137
- "step": 19580
1138
- },
1139
- {
1140
- "epoch": 13.5,
1141
- "eval_accuracy": 0.7594449853943525,
1142
- "eval_b_acc": 0.6161690104230055,
1143
- "eval_f1": 0.62474808335526,
1144
- "eval_f1_anger": 0.6223776223776223,
1145
- "eval_f1_disgust": 0.4353448275862069,
1146
- "eval_f1_fear": 0.6165413533834586,
1147
- "eval_f1_joy": 0.742164744261913,
1148
- "eval_f1_neutral": 0.8496567185091775,
1149
- "eval_f1_sadness": 0.6675588865096359,
1150
- "eval_f1_surprise": 0.4395924308588064,
1151
- "eval_loss": 0.6776713132858276,
1152
- "eval_micro_f1": 0.7594449853943525,
1153
- "eval_prec": 0.636197719648956,
1154
- "eval_prec_anger": 0.6057591623036649,
1155
- "eval_prec_disgust": 0.4488888888888889,
1156
- "eval_prec_fear": 0.633693972179289,
1157
- "eval_prec_joy": 0.7350565428109854,
1158
- "eval_prec_neutral": 0.8454317315735663,
1159
- "eval_prec_sadness": 0.6744186046511628,
1160
- "eval_prec_surprise": 0.5101351351351351,
1161
- "eval_recall": 0.6161690104230055,
1162
- "eval_recall_anger": 0.639933628318584,
1163
- "eval_recall_disgust": 0.4225941422594142,
1164
- "eval_recall_fear": 0.6002928257686676,
1165
- "eval_recall_joy": 0.7494117647058823,
1166
- "eval_recall_neutral": 0.8539241457003379,
1167
- "eval_recall_sadness": 0.6608373078961314,
1168
- "eval_recall_surprise": 0.38618925831202044,
1169
- "eval_runtime": 52.4495,
1170
- "eval_samples_per_second": 391.615,
1171
- "eval_steps_per_second": 24.481,
1172
- "step": 19782
1173
- },
1174
- {
1175
- "epoch": 13.51,
1176
- "learning_rate": 0.00010471354665644759,
1177
- "loss": 0.5261,
1178
- "step": 19800
1179
- },
1180
- {
1181
- "epoch": 13.66,
1182
- "learning_rate": 9.417512933512167e-05,
1183
- "loss": 0.5282,
1184
- "step": 20020
1185
- },
1186
- {
1187
- "epoch": 13.81,
1188
- "learning_rate": 8.363671201379575e-05,
1189
- "loss": 0.5201,
1190
- "step": 20240
1191
- },
1192
- {
1193
- "epoch": 13.96,
1194
- "learning_rate": 7.309829469246983e-05,
1195
- "loss": 0.5292,
1196
- "step": 20460
1197
- },
1198
- {
1199
- "epoch": 14.11,
1200
- "learning_rate": 6.25598773711439e-05,
1201
- "loss": 0.512,
1202
- "step": 20680
1203
- },
1204
- {
1205
- "epoch": 14.25,
1206
- "eval_accuracy": 0.7568646543330088,
1207
- "eval_b_acc": 0.6172231293216093,
1208
- "eval_f1": 0.6274045304621182,
1209
- "eval_f1_anger": 0.6168593177332957,
1210
- "eval_f1_disgust": 0.44719101123595506,
1211
- "eval_f1_fear": 0.621580547112462,
1212
- "eval_f1_joy": 0.7408979227161047,
1213
- "eval_f1_neutral": 0.8446776328228398,
1214
- "eval_f1_sadness": 0.6684141546526867,
1215
- "eval_f1_surprise": 0.4522111269614835,
1216
- "eval_loss": 0.6823310852050781,
1217
- "eval_micro_f1": 0.7568646543330088,
1218
- "eval_prec": 0.6409438141857619,
1219
- "eval_prec_anger": 0.6290971822886716,
1220
- "eval_prec_disgust": 0.4830097087378641,
1221
- "eval_prec_fear": 0.6461295418641391,
1222
- "eval_prec_joy": 0.7051445578231292,
1223
- "eval_prec_neutral": 0.8506283320639756,
1224
- "eval_prec_sadness": 0.6613070539419087,
1225
- "eval_prec_surprise": 0.5112903225806451,
1226
- "eval_recall": 0.6172231293216093,
1227
- "eval_recall_anger": 0.6050884955752213,
1228
- "eval_recall_disgust": 0.41631799163179917,
1229
- "eval_recall_fear": 0.5988286969253295,
1230
- "eval_recall_joy": 0.7804705882352941,
1231
- "eval_recall_neutral": 0.838809613218175,
1232
- "eval_recall_sadness": 0.6756756756756757,
1233
- "eval_recall_surprise": 0.4053708439897698,
1234
- "eval_runtime": 53.2289,
1235
- "eval_samples_per_second": 385.881,
1236
- "eval_steps_per_second": 24.122,
1237
- "step": 20881
1238
- },
1239
- {
1240
- "epoch": 14.26,
1241
- "learning_rate": 5.202146004981798e-05,
1242
- "loss": 0.5179,
1243
- "step": 20900
1244
- },
1245
- {
1246
- "epoch": 14.41,
1247
- "learning_rate": 4.148304272849205e-05,
1248
- "loss": 0.5085,
1249
- "step": 21120
1250
- },
1251
- {
1252
- "epoch": 14.56,
1253
- "learning_rate": 3.099252730408124e-05,
1254
- "loss": 0.5083,
1255
- "step": 21340
1256
- },
1257
- {
1258
- "epoch": 14.71,
1259
- "learning_rate": 2.0454109982755316e-05,
1260
- "loss": 0.5121,
1261
- "step": 21560
1262
- },
1263
- {
1264
- "epoch": 14.86,
1265
- "learning_rate": 9.915692661429392e-06,
1266
- "loss": 0.5026,
1267
- "step": 21780
1268
  },
1269
  {
1270
  "epoch": 15.0,
1271
- "step": 21975,
1272
- "total_flos": 6.592350719428977e+17,
1273
- "train_loss": 0.6400373776102771,
1274
- "train_runtime": 15988.8097,
1275
- "train_samples_per_second": 175.927,
1276
- "train_steps_per_second": 1.374
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1277
  }
1278
  ],
1279
- "max_steps": 21975,
1280
- "num_train_epochs": 15,
1281
- "total_flos": 6.592350719428977e+17,
1282
  "trial_name": null,
1283
  "trial_params": null
1284
  }
 
1
  {
2
+ "best_metric": 0.6206372407316966,
3
+ "best_model_checkpoint": ".exp/lora/lora-roberta-large-no-ed/checkpoint-26370",
4
+ "epoch": 19.996587613035317,
5
+ "global_step": 29300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.2,
12
+ "learning_rate": 0.0001993174061433447,
13
+ "loss": 1.1563,
14
+ "step": 293
15
  },
16
  {
17
+ "epoch": 0.4,
18
+ "learning_rate": 0.0003993174061433447,
19
+ "loss": 0.843,
20
+ "step": 586
 
 
 
 
 
 
21
  },
22
  {
23
  "epoch": 0.6,
24
+ "learning_rate": 0.0005993174061433447,
25
+ "loss": 0.8076,
26
+ "step": 879
27
+ },
28
+ {
29
+ "epoch": 0.8,
30
+ "learning_rate": 0.0007986348122866894,
31
+ "loss": 0.7841,
32
+ "step": 1172
33
+ },
34
+ {
35
+ "epoch": 1.0,
36
+ "learning_rate": 0.000997269624573379,
37
+ "loss": 0.7938,
38
+ "step": 1465
39
+ },
40
+ {
41
+ "epoch": 1.0,
42
+ "eval_accuracy": 0.7256572541382668,
43
+ "eval_b_acc": 0.4993304744933974,
44
+ "eval_f1": 0.5432686921853633,
45
+ "eval_f1_anger": 0.4929859719438877,
46
+ "eval_f1_disgust": 0.35524475524475524,
47
+ "eval_f1_fear": 0.5487421383647799,
48
+ "eval_f1_joy": 0.7036857419980601,
49
+ "eval_f1_neutral": 0.8260165373795926,
50
+ "eval_f1_sadness": 0.5789971617786188,
51
+ "eval_f1_surprise": 0.2972085385878489,
52
+ "eval_loss": 0.7589048147201538,
53
+ "eval_micro_f1": 0.7256572541382668,
54
+ "eval_prec": 0.6232926407057092,
55
+ "eval_prec_anger": 0.6222596964586846,
56
+ "eval_prec_disgust": 0.5358649789029536,
57
+ "eval_prec_fear": 0.5925297113752123,
58
+ "eval_prec_joy": 0.7258629314657329,
59
+ "eval_prec_neutral": 0.7564402810304449,
60
+ "eval_prec_sadness": 0.7149532710280374,
61
+ "eval_prec_surprise": 0.4151376146788991,
62
+ "eval_recall": 0.4993304744933974,
63
+ "eval_recall_anger": 0.4081858407079646,
64
+ "eval_recall_disgust": 0.26569037656903766,
65
+ "eval_recall_fear": 0.5109809663250366,
66
+ "eval_recall_joy": 0.6828235294117647,
67
+ "eval_recall_neutral": 0.9096883214419828,
68
+ "eval_recall_sadness": 0.4864864864864865,
69
+ "eval_recall_surprise": 0.23145780051150894,
70
+ "eval_runtime": 46.5427,
71
+ "eval_samples_per_second": 441.315,
72
+ "eval_steps_per_second": 13.794,
73
+ "step": 1465
 
 
 
 
 
 
74
  },
75
  {
76
  "epoch": 1.2,
77
+ "learning_rate": 0.0009896173881803485,
78
+ "loss": 0.9272,
79
+ "step": 1758
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
80
  },
81
  {
82
+ "epoch": 1.4,
83
+ "learning_rate": 0.0009790910723908748,
84
+ "loss": 0.8827,
85
+ "step": 2051
86
  },
87
  {
88
+ "epoch": 1.6,
89
+ "learning_rate": 0.0009685647566014011,
90
+ "loss": 0.8217,
91
+ "step": 2344
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
92
  },
93
  {
94
+ "epoch": 1.8,
95
+ "learning_rate": 0.0009580384408119275,
96
+ "loss": 0.7703,
97
+ "step": 2637
98
+ },
99
+ {
100
+ "epoch": 2.0,
101
+ "learning_rate": 0.0009475480510149093,
102
+ "loss": 0.7546,
103
+ "step": 2930
104
+ },
105
+ {
106
+ "epoch": 2.0,
107
+ "eval_accuracy": 0.7242940603700098,
108
+ "eval_b_acc": 0.5498815920183304,
109
+ "eval_f1": 0.5735049733331309,
110
+ "eval_f1_anger": 0.5553202752779248,
111
+ "eval_f1_disgust": 0.3609226594301221,
112
+ "eval_f1_fear": 0.5940274414850686,
113
+ "eval_f1_joy": 0.6989024028478196,
114
+ "eval_f1_neutral": 0.8265419298837825,
115
+ "eval_f1_sadness": 0.6172381835032437,
116
+ "eval_f1_surprise": 0.3615819209039548,
117
+ "eval_loss": 0.7481706142425537,
118
+ "eval_micro_f1": 0.7242940603700097,
119
+ "eval_prec": 0.6272234980815083,
120
+ "eval_prec_anger": 0.5324873096446701,
121
+ "eval_prec_disgust": 0.5135135135135135,
122
+ "eval_prec_fear": 0.6618705035971223,
123
+ "eval_prec_joy": 0.6027630905679686,
124
+ "eval_prec_neutral": 0.8497768963807635,
125
+ "eval_prec_sadness": 0.74,
126
+ "eval_prec_surprise": 0.49015317286652077,
127
+ "eval_recall": 0.5498815920183304,
128
+ "eval_recall_anger": 0.5801991150442478,
129
+ "eval_recall_disgust": 0.27824267782426776,
130
+ "eval_recall_fear": 0.5387994143484627,
131
+ "eval_recall_joy": 0.8315294117647059,
132
+ "eval_recall_neutral": 0.804543747653023,
133
+ "eval_recall_sadness": 0.5294117647058824,
134
+ "eval_recall_surprise": 0.2864450127877238,
135
+ "eval_runtime": 46.047,
136
+ "eval_samples_per_second": 446.066,
137
+ "eval_steps_per_second": 13.942,
138
+ "step": 2930
139
  },
140
  {
141
+ "epoch": 2.2,
142
+ "learning_rate": 0.0009370217352254357,
143
+ "loss": 0.7432,
144
+ "step": 3223
145
  },
146
  {
147
+ "epoch": 2.4,
148
+ "learning_rate": 0.0009265313454284174,
149
+ "loss": 0.737,
150
+ "step": 3516
151
  },
152
  {
153
+ "epoch": 2.6,
154
+ "learning_rate": 0.0009160050296389439,
155
+ "loss": 0.7192,
156
+ "step": 3809
157
  },
158
  {
159
+ "epoch": 2.8,
160
+ "learning_rate": 0.0009054787138494701,
161
+ "loss": 0.7207,
162
+ "step": 4102
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
163
  },
164
  {
165
  "epoch": 3.0,
166
+ "learning_rate": 0.0008949523980599964,
167
  "loss": 0.7289,
168
+ "step": 4395
169
  },
170
  {
171
+ "epoch": 3.0,
172
+ "eval_accuracy": 0.7320837390457644,
173
+ "eval_b_acc": 0.5839323096679138,
174
+ "eval_f1": 0.5984237846360054,
175
+ "eval_f1_anger": 0.5667558727326791,
176
+ "eval_f1_disgust": 0.44855967078189296,
177
+ "eval_f1_fear": 0.5956375838926176,
178
+ "eval_f1_joy": 0.7127241855035551,
179
+ "eval_f1_neutral": 0.8253590792352327,
180
+ "eval_f1_sadness": 0.641439534268325,
181
+ "eval_f1_surprise": 0.39849056603773586,
182
+ "eval_loss": 0.729333221912384,
183
+ "eval_micro_f1": 0.7320837390457644,
184
+ "eval_prec": 0.6234201141460577,
185
+ "eval_prec_anger": 0.6128617363344051,
186
+ "eval_prec_disgust": 0.44129554655870445,
187
+ "eval_prec_fear": 0.6974459724950884,
188
+ "eval_prec_joy": 0.6491397641600618,
189
+ "eval_prec_neutral": 0.8364179679969154,
190
+ "eval_prec_sadness": 0.6405919661733616,
191
+ "eval_prec_surprise": 0.4861878453038674,
192
+ "eval_recall": 0.5839323096679138,
193
+ "eval_recall_anger": 0.5271017699115044,
194
+ "eval_recall_disgust": 0.4560669456066946,
195
+ "eval_recall_fear": 0.5197657393850659,
196
+ "eval_recall_joy": 0.7901176470588235,
197
+ "eval_recall_neutral": 0.8145888096132182,
198
+ "eval_recall_sadness": 0.6422893481717011,
199
+ "eval_recall_surprise": 0.3375959079283887,
200
+ "eval_runtime": 46.166,
201
+ "eval_samples_per_second": 444.916,
202
+ "eval_steps_per_second": 13.906,
203
+ "step": 4395
204
  },
205
  {
206
+ "epoch": 3.2,
207
+ "learning_rate": 0.0008844260822705228,
208
+ "loss": 0.7017,
209
+ "step": 4688
210
  },
211
  {
212
+ "epoch": 3.4,
213
+ "learning_rate": 0.0008738997664810491,
214
+ "loss": 0.7116,
215
+ "step": 4981
216
  },
217
  {
218
  "epoch": 3.6,
219
+ "learning_rate": 0.0008633734506915754,
220
+ "loss": 0.7143,
221
+ "step": 5274
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
222
  },
223
  {
224
+ "epoch": 3.8,
225
+ "learning_rate": 0.0008528471349021016,
226
+ "loss": 0.7218,
227
+ "step": 5567
228
  },
229
  {
230
+ "epoch": 4.0,
231
+ "learning_rate": 0.000842320819112628,
232
+ "loss": 0.7076,
233
+ "step": 5860
234
  },
235
  {
236
+ "epoch": 4.0,
237
+ "eval_accuracy": 0.7466407010710808,
238
+ "eval_b_acc": 0.5649303370058901,
239
+ "eval_f1": 0.5972285504575797,
240
+ "eval_f1_anger": 0.5746792544178165,
241
+ "eval_f1_disgust": 0.3785166240409207,
242
+ "eval_f1_fear": 0.6040515653775322,
243
+ "eval_f1_joy": 0.7226870078740156,
244
+ "eval_f1_neutral": 0.8435877759219971,
245
+ "eval_f1_sadness": 0.6404109589041096,
246
+ "eval_f1_surprise": 0.4166666666666667,
247
+ "eval_loss": 0.6897642612457275,
248
+ "eval_micro_f1": 0.7466407010710808,
249
+ "eval_prec": 0.6572406702350582,
250
+ "eval_prec_anger": 0.5109771846749892,
251
+ "eval_prec_disgust": 0.4868421052631579,
252
+ "eval_prec_fear": 0.8138957816377171,
253
+ "eval_prec_joy": 0.7573491490458999,
254
+ "eval_prec_neutral": 0.81245109120946,
255
+ "eval_prec_sadness": 0.6938775510204082,
256
+ "eval_prec_surprise": 0.5252918287937743,
257
+ "eval_recall": 0.5649303370058901,
258
+ "eval_recall_anger": 0.6565265486725663,
259
+ "eval_recall_disgust": 0.30962343096234307,
260
+ "eval_recall_fear": 0.4802342606149341,
261
+ "eval_recall_joy": 0.6910588235294117,
262
+ "eval_recall_neutral": 0.8772061584678934,
263
+ "eval_recall_sadness": 0.5945945945945946,
264
+ "eval_recall_surprise": 0.3452685421994885,
265
+ "eval_runtime": 46.2244,
266
+ "eval_samples_per_second": 444.354,
267
+ "eval_steps_per_second": 13.889,
268
+ "step": 5860
269
  },
270
  {
271
  "epoch": 4.2,
272
+ "learning_rate": 0.0008317945033231543,
273
+ "loss": 0.6977,
274
+ "step": 6153
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
275
  },
276
  {
277
+ "epoch": 4.4,
278
+ "learning_rate": 0.0008212681875336806,
279
+ "loss": 0.685,
280
+ "step": 6446
281
  },
282
  {
283
+ "epoch": 4.6,
284
+ "learning_rate": 0.000810741871744207,
285
+ "loss": 0.6985,
286
+ "step": 6739
287
  },
288
  {
289
+ "epoch": 4.8,
290
+ "learning_rate": 0.0008002155559547333,
291
+ "loss": 0.6976,
292
+ "step": 7032
293
+ },
294
+ {
295
+ "epoch": 5.0,
296
+ "learning_rate": 0.0007896892401652595,
297
+ "loss": 0.6925,
298
+ "step": 7325
299
+ },
300
+ {
301
+ "epoch": 5.0,
302
+ "eval_accuracy": 0.7402629016553067,
303
+ "eval_b_acc": 0.5916067970161544,
304
+ "eval_f1": 0.5971544894232231,
305
+ "eval_f1_anger": 0.5747069094537292,
306
+ "eval_f1_disgust": 0.3850687622789784,
307
+ "eval_f1_fear": 0.5954887218045113,
308
+ "eval_f1_joy": 0.721651810899244,
309
+ "eval_f1_neutral": 0.8404170008019246,
310
+ "eval_f1_sadness": 0.6490066225165564,
311
+ "eval_f1_surprise": 0.41374159820761763,
312
+ "eval_loss": 0.7038670182228088,
313
+ "eval_micro_f1": 0.7402629016553067,
314
+ "eval_prec": 0.6121145881871085,
315
+ "eval_prec_anger": 0.5233984552476147,
316
+ "eval_prec_disgust": 0.362962962962963,
317
+ "eval_prec_fear": 0.6120556414219475,
318
+ "eval_prec_joy": 0.693258183394754,
319
+ "eval_prec_neutral": 0.8446003602920261,
320
+ "eval_prec_sadness": 0.751219512195122,
321
+ "eval_prec_surprise": 0.49730700179533216,
322
+ "eval_recall": 0.5916067970161544,
323
+ "eval_recall_anger": 0.6371681415929203,
324
+ "eval_recall_disgust": 0.4100418410041841,
325
+ "eval_recall_fear": 0.5797950219619327,
326
+ "eval_recall_joy": 0.7524705882352941,
327
+ "eval_recall_neutral": 0.8362748779571911,
328
+ "eval_recall_sadness": 0.5712771595124536,
329
+ "eval_recall_surprise": 0.35421994884910485,
330
+ "eval_runtime": 46.1526,
331
+ "eval_samples_per_second": 445.045,
332
+ "eval_steps_per_second": 13.91,
333
+ "step": 7325
334
+ },
335
+ {
336
+ "epoch": 5.2,
337
+ "learning_rate": 0.0007791629243757859,
338
+ "loss": 0.6851,
339
+ "step": 7618
340
+ },
341
+ {
342
+ "epoch": 5.4,
343
+ "learning_rate": 0.0007686366085863123,
344
+ "loss": 0.671,
345
+ "step": 7911
346
+ },
347
+ {
348
+ "epoch": 5.6,
349
+ "learning_rate": 0.000758146218789294,
350
+ "loss": 0.6817,
351
+ "step": 8204
352
+ },
353
+ {
354
+ "epoch": 5.8,
355
+ "learning_rate": 0.0007476558289922759,
356
+ "loss": 0.683,
357
+ "step": 8497
358
  },
359
  {
360
  "epoch": 6.0,
361
+ "learning_rate": 0.0007371295132028022,
362
+ "loss": 0.6841,
363
+ "step": 8790
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
364
  },
365
  {
366
+ "epoch": 6.0,
367
+ "eval_accuracy": 0.7516066212268744,
368
+ "eval_b_acc": 0.5820003637019402,
369
+ "eval_f1": 0.6075976734562277,
370
+ "eval_f1_anger": 0.5587018771874006,
371
+ "eval_f1_disgust": 0.4760180995475113,
372
+ "eval_f1_fear": 0.5998107852412488,
373
+ "eval_f1_joy": 0.7342120343839541,
374
+ "eval_f1_neutral": 0.8439233370913191,
375
+ "eval_f1_sadness": 0.6554338668913225,
376
+ "eval_f1_surprise": 0.3850837138508371,
377
+ "eval_loss": 0.6704264283180237,
378
+ "eval_micro_f1": 0.7516066212268744,
379
+ "eval_prec": 0.6607440078057637,
380
+ "eval_prec_anger": 0.6576779026217229,
381
+ "eval_prec_disgust": 0.4194577352472089,
382
+ "eval_prec_fear": 0.8475935828877005,
383
+ "eval_prec_joy": 0.7157541899441341,
384
+ "eval_prec_neutral": 0.8120281176776881,
385
+ "eval_prec_sadness": 0.6971326164874552,
386
+ "eval_prec_surprise": 0.4755639097744361,
387
+ "eval_recall": 0.5820003637019402,
388
+ "eval_recall_anger": 0.4856194690265487,
389
+ "eval_recall_disgust": 0.5502092050209205,
390
+ "eval_recall_fear": 0.46412884333821375,
391
+ "eval_recall_joy": 0.7536470588235294,
392
+ "eval_recall_neutral": 0.8784265865565152,
393
+ "eval_recall_sadness": 0.6184419713831478,
394
+ "eval_recall_surprise": 0.3235294117647059,
395
+ "eval_runtime": 46.0795,
396
+ "eval_samples_per_second": 445.752,
397
+ "eval_steps_per_second": 13.932,
398
+ "step": 8790
399
+ },
400
+ {
401
+ "epoch": 6.2,
402
+ "learning_rate": 0.0007266031974133286,
403
+ "loss": 0.6618,
404
+ "step": 9083
405
+ },
406
+ {
407
+ "epoch": 6.4,
408
+ "learning_rate": 0.0007160768816238548,
409
+ "loss": 0.6658,
410
+ "step": 9376
411
+ },
412
+ {
413
+ "epoch": 6.6,
414
+ "learning_rate": 0.0007055505658343812,
415
+ "loss": 0.6721,
416
+ "step": 9669
417
+ },
418
+ {
419
+ "epoch": 6.8,
420
+ "learning_rate": 0.0006950242500449076,
421
+ "loss": 0.6664,
422
+ "step": 9962
423
+ },
424
+ {
425
+ "epoch": 7.0,
426
+ "learning_rate": 0.0006844979342554338,
427
+ "loss": 0.6715,
428
+ "step": 10255
429
+ },
430
+ {
431
+ "epoch": 7.0,
432
+ "eval_accuracy": 0.7411879259980526,
433
+ "eval_b_acc": 0.6179791982250035,
434
+ "eval_f1": 0.611239662539826,
435
+ "eval_f1_anger": 0.5761816741484025,
436
+ "eval_f1_disgust": 0.45527156549520764,
437
+ "eval_f1_fear": 0.6020128087831657,
438
+ "eval_f1_joy": 0.7317787540835867,
439
+ "eval_f1_neutral": 0.8391440250060112,
440
+ "eval_f1_sadness": 0.6545357238426546,
441
+ "eval_f1_surprise": 0.4197530864197531,
442
+ "eval_loss": 0.6918847560882568,
443
+ "eval_micro_f1": 0.7411879259980525,
444
+ "eval_prec": 0.6245536912240063,
445
+ "eval_prec_anger": 0.551288529560384,
446
+ "eval_prec_disgust": 0.3682170542635659,
447
+ "eval_prec_fear": 0.802439024390244,
448
+ "eval_prec_joy": 0.7019667170953101,
449
+ "eval_prec_neutral": 0.860199152124618,
450
+ "eval_prec_sadness": 0.6610810810810811,
451
+ "eval_prec_surprise": 0.42668428005284015,
452
+ "eval_recall": 0.6179791982250035,
453
+ "eval_recall_anger": 0.603429203539823,
454
+ "eval_recall_disgust": 0.5962343096234309,
455
+ "eval_recall_fear": 0.4816983894582723,
456
+ "eval_recall_joy": 0.764235294117647,
457
+ "eval_recall_neutral": 0.8190950056327451,
458
+ "eval_recall_sadness": 0.6481187069422364,
459
+ "eval_recall_surprise": 0.41304347826086957,
460
+ "eval_runtime": 46.1915,
461
+ "eval_samples_per_second": 444.671,
462
+ "eval_steps_per_second": 13.899,
463
+ "step": 10255
464
+ },
465
+ {
466
+ "epoch": 7.2,
467
+ "learning_rate": 0.0006739716184659601,
468
+ "loss": 0.6479,
469
+ "step": 10548
470
+ },
471
+ {
472
+ "epoch": 7.4,
473
+ "learning_rate": 0.0006634453026764866,
474
+ "loss": 0.6561,
475
+ "step": 10841
476
+ },
477
+ {
478
+ "epoch": 7.6,
479
+ "learning_rate": 0.0006529189868870128,
480
+ "loss": 0.6625,
481
+ "step": 11134
482
+ },
483
+ {
484
+ "epoch": 7.8,
485
+ "learning_rate": 0.0006423926710975391,
486
+ "loss": 0.658,
487
+ "step": 11427
488
+ },
489
+ {
490
+ "epoch": 8.0,
491
+ "learning_rate": 0.0006318663553080653,
492
+ "loss": 0.6562,
493
+ "step": 11720
494
+ },
495
+ {
496
+ "epoch": 8.0,
497
+ "eval_accuracy": 0.7325219084712755,
498
+ "eval_b_acc": 0.6128679845265063,
499
+ "eval_f1": 0.6013536581571658,
500
+ "eval_f1_anger": 0.5731053840265374,
501
+ "eval_f1_disgust": 0.42007434944237915,
502
+ "eval_f1_fear": 0.5870646766169154,
503
+ "eval_f1_joy": 0.7238035658429777,
504
+ "eval_f1_neutral": 0.8292248292248293,
505
+ "eval_f1_sadness": 0.6645180193378261,
506
+ "eval_f1_surprise": 0.4116847826086957,
507
+ "eval_loss": 0.7244542241096497,
508
+ "eval_micro_f1": 0.7325219084712755,
509
+ "eval_prec": 0.5985056915840363,
510
+ "eval_prec_anger": 0.5319753671245855,
511
+ "eval_prec_disgust": 0.3779264214046823,
512
+ "eval_prec_fear": 0.5704419889502762,
513
+ "eval_prec_joy": 0.6498782999438307,
514
+ "eval_prec_neutral": 0.8770680628272252,
515
+ "eval_prec_sadness": 0.7431192660550459,
516
+ "eval_prec_surprise": 0.4391304347826087,
517
+ "eval_recall": 0.6128679845265063,
518
+ "eval_recall_anger": 0.6211283185840708,
519
+ "eval_recall_disgust": 0.47280334728033474,
520
+ "eval_recall_fear": 0.6046852122986823,
521
+ "eval_recall_joy": 0.8167058823529412,
522
+ "eval_recall_neutral": 0.7863312054074352,
523
+ "eval_recall_sadness": 0.6009538950715422,
524
+ "eval_recall_surprise": 0.3874680306905371,
525
+ "eval_runtime": 46.2278,
526
+ "eval_samples_per_second": 444.321,
527
+ "eval_steps_per_second": 13.888,
528
+ "step": 11720
529
+ },
530
+ {
531
+ "epoch": 8.2,
532
+ "learning_rate": 0.0006213400395185917,
533
+ "loss": 0.6406,
534
+ "step": 12013
535
+ },
536
+ {
537
+ "epoch": 8.4,
538
+ "learning_rate": 0.0006108137237291181,
539
+ "loss": 0.6459,
540
+ "step": 12306
541
+ },
542
+ {
543
+ "epoch": 8.6,
544
+ "learning_rate": 0.0006002874079396443,
545
+ "loss": 0.6482,
546
+ "step": 12599
547
+ },
548
+ {
549
+ "epoch": 8.8,
550
+ "learning_rate": 0.0005897610921501707,
551
+ "loss": 0.6502,
552
+ "step": 12892
553
  },
554
  {
555
  "epoch": 9.0,
556
+ "learning_rate": 0.000579234776360697,
557
+ "loss": 0.6426,
558
+ "step": 13185
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
559
  },
560
  {
561
+ "epoch": 9.0,
562
+ "eval_accuracy": 0.7510223953261927,
563
+ "eval_b_acc": 0.6108946329415156,
564
+ "eval_f1": 0.6175413637878915,
565
+ "eval_f1_anger": 0.588235294117647,
566
+ "eval_f1_disgust": 0.42267050912584053,
567
+ "eval_f1_fear": 0.6240409207161126,
568
+ "eval_f1_joy": 0.7357859531772576,
569
+ "eval_f1_neutral": 0.8457566654149455,
570
+ "eval_f1_sadness": 0.6677704194260485,
571
+ "eval_f1_surprise": 0.4385297845373891,
572
+ "eval_loss": 0.6683408617973328,
573
+ "eval_micro_f1": 0.7510223953261927,
574
+ "eval_prec": 0.6304447087675242,
575
+ "eval_prec_anger": 0.5768208399787347,
576
+ "eval_prec_disgust": 0.3907637655417407,
577
+ "eval_prec_fear": 0.746938775510204,
578
+ "eval_prec_joy": 0.7215562090024882,
579
+ "eval_prec_neutral": 0.8457566654149455,
580
+ "eval_prec_sadness": 0.6966033390903857,
581
+ "eval_prec_surprise": 0.43467336683417085,
582
+ "eval_recall": 0.6108946329415156,
583
+ "eval_recall_anger": 0.6001106194690266,
584
+ "eval_recall_disgust": 0.4602510460251046,
585
+ "eval_recall_fear": 0.5358711566617862,
586
+ "eval_recall_joy": 0.7505882352941177,
587
+ "eval_recall_neutral": 0.8457566654149455,
588
+ "eval_recall_sadness": 0.6412294647588765,
589
+ "eval_recall_surprise": 0.4424552429667519,
590
+ "eval_runtime": 46.02,
591
+ "eval_samples_per_second": 446.328,
592
+ "eval_steps_per_second": 13.95,
593
+ "step": 13185
594
+ },
595
+ {
596
+ "epoch": 9.2,
597
+ "learning_rate": 0.0005687084605712233,
598
+ "loss": 0.6219,
599
+ "step": 13478
600
+ },
601
+ {
602
+ "epoch": 9.4,
603
+ "learning_rate": 0.0005581821447817496,
604
+ "loss": 0.629,
605
+ "step": 13771
606
+ },
607
+ {
608
+ "epoch": 9.6,
609
+ "learning_rate": 0.000547655828992276,
610
+ "loss": 0.6295,
611
+ "step": 14064
612
+ },
613
+ {
614
+ "epoch": 9.8,
615
+ "learning_rate": 0.0005371295132028022,
616
+ "loss": 0.6341,
617
+ "step": 14357
618
+ },
619
+ {
620
+ "epoch": 10.0,
621
+ "learning_rate": 0.0005266031974133285,
622
+ "loss": 0.6278,
623
+ "step": 14650
624
+ },
625
+ {
626
+ "epoch": 10.0,
627
+ "eval_accuracy": 0.7544790652385589,
628
+ "eval_b_acc": 0.5967589307999713,
629
+ "eval_f1": 0.6141821019437051,
630
+ "eval_f1_anger": 0.5878859857482185,
631
+ "eval_f1_disgust": 0.44155844155844154,
632
+ "eval_f1_fear": 0.6228143213988342,
633
+ "eval_f1_joy": 0.7319787131107887,
634
+ "eval_f1_neutral": 0.8493716172828181,
635
+ "eval_f1_sadness": 0.6534983341266064,
636
+ "eval_f1_surprise": 0.41216730038022814,
637
+ "eval_loss": 0.6661337018013,
638
+ "eval_micro_f1": 0.7544790652385589,
639
+ "eval_prec": 0.642724018193579,
640
+ "eval_prec_anger": 0.6346153846153846,
641
+ "eval_prec_disgust": 0.45739910313901344,
642
+ "eval_prec_fear": 0.722007722007722,
643
+ "eval_prec_joy": 0.75311100049776,
644
+ "eval_prec_neutral": 0.8304035874439462,
645
+ "eval_prec_sadness": 0.5930885529157668,
646
+ "eval_prec_surprise": 0.5084427767354597,
647
+ "eval_recall": 0.5967589307999713,
648
+ "eval_recall_anger": 0.547566371681416,
649
+ "eval_recall_disgust": 0.42677824267782427,
650
+ "eval_recall_fear": 0.5475841874084919,
651
+ "eval_recall_joy": 0.712,
652
+ "eval_recall_neutral": 0.8692264363499812,
653
+ "eval_recall_sadness": 0.7276099629040805,
654
+ "eval_recall_surprise": 0.34654731457800514,
655
+ "eval_runtime": 46.1343,
656
+ "eval_samples_per_second": 445.222,
657
+ "eval_steps_per_second": 13.916,
658
+ "step": 14650
659
+ },
660
+ {
661
+ "epoch": 10.2,
662
+ "learning_rate": 0.0005161128076163104,
663
+ "loss": 0.6132,
664
+ "step": 14943
665
+ },
666
+ {
667
+ "epoch": 10.4,
668
+ "learning_rate": 0.0005055864918268367,
669
+ "loss": 0.6134,
670
+ "step": 15236
671
+ },
672
+ {
673
+ "epoch": 10.6,
674
+ "learning_rate": 0.0004950961020298186,
675
+ "loss": 0.6153,
676
+ "step": 15529
677
+ },
678
+ {
679
+ "epoch": 10.8,
680
+ "learning_rate": 0.0004845697862403449,
681
+ "loss": 0.6115,
682
+ "step": 15822
683
+ },
684
+ {
685
+ "epoch": 11.0,
686
+ "learning_rate": 0.0004740434704508712,
687
+ "loss": 0.6218,
688
+ "step": 16115
689
+ },
690
+ {
691
+ "epoch": 11.0,
692
+ "eval_accuracy": 0.750730282375852,
693
+ "eval_b_acc": 0.5958006635298841,
694
+ "eval_f1": 0.6142987968349727,
695
+ "eval_f1_anger": 0.5728,
696
+ "eval_f1_disgust": 0.45192307692307687,
697
+ "eval_f1_fear": 0.6015971606033718,
698
+ "eval_f1_joy": 0.7337797782412998,
699
+ "eval_f1_neutral": 0.8416802042237178,
700
+ "eval_f1_sadness": 0.6666666666666666,
701
+ "eval_f1_surprise": 0.431644691186676,
702
+ "eval_loss": 0.6714352965354919,
703
+ "eval_micro_f1": 0.750730282375852,
704
+ "eval_prec": 0.647849574337048,
705
+ "eval_prec_anger": 0.6795747911921033,
706
+ "eval_prec_disgust": 0.4181494661921708,
707
+ "eval_prec_fear": 0.7635135135135135,
708
+ "eval_prec_joy": 0.6877958427660013,
709
+ "eval_prec_neutral": 0.832369411548701,
710
+ "eval_prec_sadness": 0.6816168327796235,
711
+ "eval_prec_surprise": 0.47192716236722304,
712
+ "eval_recall": 0.5958006635298841,
713
+ "eval_recall_anger": 0.4950221238938053,
714
+ "eval_recall_disgust": 0.4916317991631799,
715
+ "eval_recall_fear": 0.49633967789165445,
716
+ "eval_recall_joy": 0.7863529411764706,
717
+ "eval_recall_neutral": 0.8512016522718738,
718
+ "eval_recall_sadness": 0.6523582405935348,
719
+ "eval_recall_surprise": 0.3976982097186701,
720
+ "eval_runtime": 46.0325,
721
+ "eval_samples_per_second": 446.206,
722
+ "eval_steps_per_second": 13.947,
723
+ "step": 16115
724
+ },
725
+ {
726
+ "epoch": 11.2,
727
+ "learning_rate": 0.00046351715466139755,
728
+ "loss": 0.5966,
729
+ "step": 16408
730
+ },
731
+ {
732
+ "epoch": 11.4,
733
+ "learning_rate": 0.0004529908388719238,
734
+ "loss": 0.5988,
735
+ "step": 16701
736
+ },
737
+ {
738
+ "epoch": 11.6,
739
+ "learning_rate": 0.0004424645230824502,
740
+ "loss": 0.6077,
741
+ "step": 16994
742
+ },
743
+ {
744
+ "epoch": 11.8,
745
+ "learning_rate": 0.0004319382072929765,
746
+ "loss": 0.6089,
747
+ "step": 17287
748
  },
749
  {
750
+ "epoch": 12.0,
751
+ "learning_rate": 0.0004214118915035028,
752
+ "loss": 0.6077,
753
+ "step": 17580
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
754
  },
755
  {
756
  "epoch": 12.0,
757
+ "eval_accuracy": 0.7543330087633885,
758
+ "eval_b_acc": 0.6171055294678581,
759
+ "eval_f1": 0.6187242211015894,
760
+ "eval_f1_anger": 0.6074972436604189,
761
+ "eval_f1_disgust": 0.429035752979415,
762
+ "eval_f1_fear": 0.6134515890613451,
763
+ "eval_f1_joy": 0.7370813397129187,
764
+ "eval_f1_neutral": 0.8496555576242785,
765
+ "eval_f1_sadness": 0.6629986244841817,
766
+ "eval_f1_surprise": 0.431349440188568,
767
+ "eval_loss": 0.6648654341697693,
768
+ "eval_micro_f1": 0.7543330087633885,
769
+ "eval_prec": 0.6216330895487993,
770
+ "eval_prec_anger": 0.6054945054945055,
771
+ "eval_prec_disgust": 0.4449438202247191,
772
+ "eval_prec_fear": 0.6194029850746269,
773
+ "eval_prec_joy": 0.7496350364963503,
774
+ "eval_prec_neutral": 0.842596011816839,
775
+ "eval_prec_sadness": 0.6893592677345538,
776
+ "eval_prec_surprise": 0.4,
777
+ "eval_recall": 0.6171055294678581,
778
+ "eval_recall_anger": 0.6095132743362832,
779
+ "eval_recall_disgust": 0.41422594142259417,
780
+ "eval_recall_fear": 0.6076134699853587,
781
+ "eval_recall_joy": 0.7249411764705882,
782
+ "eval_recall_neutral": 0.8568343972962824,
783
+ "eval_recall_sadness": 0.6385797562268151,
784
+ "eval_recall_surprise": 0.4680306905370844,
785
+ "eval_runtime": 46.1374,
786
+ "eval_samples_per_second": 445.192,
787
+ "eval_steps_per_second": 13.915,
788
+ "step": 17580
789
+ },
790
+ {
791
+ "epoch": 12.2,
792
+ "learning_rate": 0.0004108855757140291,
793
+ "loss": 0.5841,
794
+ "step": 17873
795
+ },
796
+ {
797
+ "epoch": 12.4,
798
+ "learning_rate": 0.0004003592599245554,
799
+ "loss": 0.5891,
800
+ "step": 18166
801
+ },
802
+ {
803
+ "epoch": 12.6,
804
+ "learning_rate": 0.00038983294413508175,
805
+ "loss": 0.5867,
806
+ "step": 18459
807
+ },
808
+ {
809
+ "epoch": 12.8,
810
+ "learning_rate": 0.000379306628345608,
811
+ "loss": 0.5906,
812
+ "step": 18752
813
+ },
814
+ {
815
+ "epoch": 13.0,
816
+ "learning_rate": 0.0003687803125561344,
817
+ "loss": 0.5868,
818
+ "step": 19045
819
+ },
820
+ {
821
+ "epoch": 13.0,
822
+ "eval_accuracy": 0.7583739045764363,
823
+ "eval_b_acc": 0.6026010025373034,
824
+ "eval_f1": 0.6223744496289562,
825
+ "eval_f1_anger": 0.6024734982332155,
826
+ "eval_f1_disgust": 0.44166666666666665,
827
+ "eval_f1_fear": 0.6313213703099511,
828
+ "eval_f1_joy": 0.735365152386429,
829
+ "eval_f1_neutral": 0.8496863696717184,
830
+ "eval_f1_sadness": 0.6641961231470923,
831
+ "eval_f1_surprise": 0.43191196698762035,
832
+ "eval_loss": 0.6679861545562744,
833
+ "eval_micro_f1": 0.7583739045764363,
834
+ "eval_prec": 0.64731907895135,
835
+ "eval_prec_anger": 0.6442065491183879,
836
+ "eval_prec_disgust": 0.43983402489626555,
837
+ "eval_prec_fear": 0.712707182320442,
838
+ "eval_prec_joy": 0.7192350956130483,
839
+ "eval_prec_neutral": 0.8292966306193583,
840
+ "eval_prec_sadness": 0.7186921653300432,
841
+ "eval_prec_surprise": 0.46726190476190477,
842
+ "eval_recall": 0.6026010025373034,
843
+ "eval_recall_anger": 0.5658185840707964,
844
+ "eval_recall_disgust": 0.4435146443514644,
845
+ "eval_recall_fear": 0.5666178623718887,
846
+ "eval_recall_joy": 0.7522352941176471,
847
+ "eval_recall_neutral": 0.8711040180247841,
848
+ "eval_recall_sadness": 0.6173820879703232,
849
+ "eval_recall_surprise": 0.40153452685422,
850
+ "eval_runtime": 46.0652,
851
+ "eval_samples_per_second": 445.89,
852
+ "eval_steps_per_second": 13.937,
853
+ "step": 19045
854
+ },
855
+ {
856
+ "epoch": 13.2,
857
+ "learning_rate": 0.0003582539967666607,
858
+ "loss": 0.5689,
859
+ "step": 19338
860
+ },
861
+ {
862
+ "epoch": 13.4,
863
+ "learning_rate": 0.000347727680977187,
864
+ "loss": 0.5716,
865
+ "step": 19631
866
+ },
867
+ {
868
+ "epoch": 13.6,
869
+ "learning_rate": 0.0003372372911801689,
870
+ "loss": 0.5675,
871
+ "step": 19924
872
+ },
873
+ {
874
+ "epoch": 13.8,
875
+ "learning_rate": 0.00032674690138315073,
876
+ "loss": 0.5758,
877
+ "step": 20217
878
+ },
879
+ {
880
+ "epoch": 14.0,
881
+ "learning_rate": 0.00031622058559367704,
882
+ "loss": 0.5747,
883
+ "step": 20510
884
+ },
885
+ {
886
+ "epoch": 14.0,
887
+ "eval_accuracy": 0.755111976630964,
888
+ "eval_b_acc": 0.6048530634576196,
889
+ "eval_f1": 0.6154691317356998,
890
+ "eval_f1_anger": 0.6074639062925634,
891
+ "eval_f1_disgust": 0.4108352144469526,
892
+ "eval_f1_fear": 0.607483492296405,
893
+ "eval_f1_joy": 0.7358854935817335,
894
+ "eval_f1_neutral": 0.8482922954725973,
895
+ "eval_f1_sadness": 0.6642149929278642,
896
+ "eval_f1_surprise": 0.43410852713178294,
897
+ "eval_loss": 0.6692087054252625,
898
+ "eval_micro_f1": 0.755111976630964,
899
+ "eval_prec": 0.6292971112960697,
900
+ "eval_prec_anger": 0.5984970477724101,
901
+ "eval_prec_disgust": 0.44607843137254904,
902
+ "eval_prec_fear": 0.6088235294117647,
903
+ "eval_prec_joy": 0.711399077531298,
904
+ "eval_prec_neutral": 0.8443865686912845,
905
+ "eval_prec_sadness": 0.712378640776699,
906
+ "eval_prec_surprise": 0.4835164835164835,
907
+ "eval_recall": 0.6048530634576196,
908
+ "eval_recall_anger": 0.6167035398230089,
909
  "eval_recall_disgust": 0.3807531380753138,
910
+ "eval_recall_fear": 0.6061493411420205,
911
+ "eval_recall_joy": 0.7621176470588236,
912
+ "eval_recall_neutral": 0.8522343221930154,
913
+ "eval_recall_sadness": 0.6221515633280339,
914
+ "eval_recall_surprise": 0.3938618925831202,
915
+ "eval_runtime": 46.1819,
916
+ "eval_samples_per_second": 444.763,
917
+ "eval_steps_per_second": 13.902,
918
+ "step": 20510
919
  },
920
  {
921
+ "epoch": 14.2,
922
+ "learning_rate": 0.00030569426980420336,
923
+ "loss": 0.5521,
924
+ "step": 20803
925
  },
926
  {
927
+ "epoch": 14.4,
928
+ "learning_rate": 0.00029516795401472967,
929
+ "loss": 0.55,
930
+ "step": 21096
931
  },
932
  {
933
+ "epoch": 14.6,
934
+ "learning_rate": 0.000284641638225256,
935
+ "loss": 0.5572,
936
+ "step": 21389
937
  },
938
  {
939
+ "epoch": 14.8,
940
+ "learning_rate": 0.0002741153224357823,
941
+ "loss": 0.5615,
942
+ "step": 21682
943
  },
944
  {
945
+ "epoch": 15.0,
946
+ "learning_rate": 0.00026358900664630856,
947
+ "loss": 0.5632,
948
+ "step": 21975
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
949
  },
950
  {
951
  "epoch": 15.0,
952
+ "eval_accuracy": 0.7550632911392405,
953
+ "eval_b_acc": 0.6104260663388762,
954
+ "eval_f1": 0.6185386561537733,
955
+ "eval_f1_anger": 0.6062717770034843,
956
+ "eval_f1_disgust": 0.4662349676225717,
957
+ "eval_f1_fear": 0.5972434915773354,
958
+ "eval_f1_joy": 0.7371225577264653,
959
+ "eval_f1_neutral": 0.8455345440928667,
960
+ "eval_f1_sadness": 0.669596264762428,
961
+ "eval_f1_surprise": 0.4077669902912621,
962
+ "eval_loss": 0.6762722134590149,
963
+ "eval_micro_f1": 0.7550632911392405,
964
+ "eval_prec": 0.6390061654621464,
965
+ "eval_prec_anger": 0.6381418092909535,
966
+ "eval_prec_disgust": 0.417910447761194,
967
+ "eval_prec_fear": 0.6260032102728732,
968
+ "eval_prec_joy": 0.6977721731820092,
969
+ "eval_prec_neutral": 0.8431665421956684,
970
+ "eval_prec_sadness": 0.6949828962371721,
971
+ "eval_prec_surprise": 0.5550660792951542,
972
+ "eval_recall": 0.6104260663388762,
973
+ "eval_recall_anger": 0.577433628318584,
974
+ "eval_recall_disgust": 0.5271966527196653,
975
+ "eval_recall_fear": 0.5710102489019033,
976
+ "eval_recall_joy": 0.7811764705882352,
977
+ "eval_recall_neutral": 0.8479158843409689,
978
+ "eval_recall_sadness": 0.6459989401165872,
979
+ "eval_recall_surprise": 0.32225063938618925,
980
+ "eval_runtime": 46.0659,
981
+ "eval_samples_per_second": 445.883,
982
+ "eval_steps_per_second": 13.937,
983
+ "step": 21975
984
+ },
985
+ {
986
+ "epoch": 15.2,
987
+ "learning_rate": 0.0002530626908568349,
988
+ "loss": 0.5379,
989
+ "step": 22268
990
+ },
991
+ {
992
+ "epoch": 15.4,
993
+ "learning_rate": 0.00024253637506736124,
994
+ "loss": 0.5403,
995
+ "step": 22561
996
+ },
997
+ {
998
+ "epoch": 15.6,
999
+ "learning_rate": 0.00023201005927788758,
1000
+ "loss": 0.5446,
1001
+ "step": 22854
1002
+ },
1003
+ {
1004
+ "epoch": 15.8,
1005
+ "learning_rate": 0.00022148374348841387,
1006
+ "loss": 0.5467,
1007
+ "step": 23147
1008
+ },
1009
+ {
1010
+ "epoch": 16.0,
1011
+ "learning_rate": 0.00021095742769894018,
1012
+ "loss": 0.546,
1013
+ "step": 23440
1014
+ },
1015
+ {
1016
+ "epoch": 16.0,
1017
+ "eval_accuracy": 0.7537000973709834,
1018
+ "eval_b_acc": 0.6088681990875895,
1019
+ "eval_f1": 0.6204872320296809,
1020
+ "eval_f1_anger": 0.6185002736726875,
1021
+ "eval_f1_disgust": 0.41638225255972694,
1022
+ "eval_f1_fear": 0.6321401370906321,
1023
+ "eval_f1_joy": 0.7359859309738404,
1024
+ "eval_f1_neutral": 0.8420753645142964,
1025
+ "eval_f1_sadness": 0.6701657458563536,
1026
+ "eval_f1_surprise": 0.4281609195402299,
1027
+ "eval_loss": 0.6880349516868591,
1028
+ "eval_micro_f1": 0.7537000973709834,
1029
+ "eval_prec": 0.6365138577031803,
1030
+ "eval_prec_anger": 0.6121343445287107,
1031
+ "eval_prec_disgust": 0.456359102244389,
1032
+ "eval_prec_fear": 0.6587301587301587,
1033
+ "eval_prec_joy": 0.6905940594059405,
1034
+ "eval_prec_neutral": 0.8493124522536287,
1035
+ "eval_prec_sadness": 0.6999422965954991,
1036
+ "eval_prec_surprise": 0.4885245901639344,
1037
+ "eval_recall": 0.6088681990875895,
1038
+ "eval_recall_anger": 0.625,
1039
+ "eval_recall_disgust": 0.38284518828451886,
1040
+ "eval_recall_fear": 0.6076134699853587,
1041
+ "eval_recall_joy": 0.7877647058823529,
1042
+ "eval_recall_neutral": 0.8349605707848291,
1043
+ "eval_recall_sadness": 0.6428192898781134,
1044
+ "eval_recall_surprise": 0.38107416879795397,
1045
+ "eval_runtime": 46.5188,
1046
+ "eval_samples_per_second": 441.542,
1047
+ "eval_steps_per_second": 13.801,
1048
+ "step": 23440
1049
+ },
1050
+ {
1051
+ "epoch": 16.2,
1052
+ "learning_rate": 0.0002004311119094665,
1053
+ "loss": 0.5239,
1054
+ "step": 23733
1055
+ },
1056
+ {
1057
+ "epoch": 16.4,
1058
+ "learning_rate": 0.0001899047961199928,
1059
+ "loss": 0.5223,
1060
+ "step": 24026
1061
+ },
1062
+ {
1063
+ "epoch": 16.6,
1064
+ "learning_rate": 0.00017941440632297467,
1065
+ "loss": 0.5312,
1066
+ "step": 24319
1067
+ },
1068
+ {
1069
+ "epoch": 16.8,
1070
+ "learning_rate": 0.00016888809053350098,
1071
+ "loss": 0.5308,
1072
+ "step": 24612
1073
+ },
1074
+ {
1075
+ "epoch": 17.0,
1076
+ "learning_rate": 0.0001583617747440273,
1077
+ "loss": 0.5354,
1078
+ "step": 24905
1079
+ },
1080
+ {
1081
+ "epoch": 17.0,
1082
+ "eval_accuracy": 0.7544790652385589,
1083
+ "eval_b_acc": 0.6097199422404823,
1084
+ "eval_f1": 0.6222181238744549,
1085
+ "eval_f1_anger": 0.6241173275393808,
1086
+ "eval_f1_disgust": 0.42105263157894735,
1087
+ "eval_f1_fear": 0.632506004803843,
1088
+ "eval_f1_joy": 0.7375304810463312,
1089
+ "eval_f1_neutral": 0.8440314781454441,
1090
+ "eval_f1_sadness": 0.663218077865505,
1091
+ "eval_f1_surprise": 0.4330708661417323,
1092
+ "eval_loss": 0.6822559833526611,
1093
+ "eval_micro_f1": 0.7544790652385589,
1094
+ "eval_prec": 0.6398646312953825,
1095
+ "eval_prec_anger": 0.6131270010672358,
1096
+ "eval_prec_disgust": 0.49162011173184356,
1097
+ "eval_prec_fear": 0.6978798586572438,
1098
+ "eval_prec_joy": 0.6971919530595139,
1099
+ "eval_prec_neutral": 0.8525186745834131,
1100
+ "eval_prec_sadness": 0.6819708846584547,
1101
+ "eval_prec_surprise": 0.444743935309973,
1102
+ "eval_recall": 0.6097199422404823,
1103
+ "eval_recall_anger": 0.6355088495575221,
1104
+ "eval_recall_disgust": 0.3682008368200837,
1105
+ "eval_recall_fear": 0.5783308931185944,
1106
+ "eval_recall_joy": 0.7828235294117647,
1107
+ "eval_recall_neutral": 0.8357116034547503,
1108
+ "eval_recall_sadness": 0.6454689984101749,
1109
+ "eval_recall_surprise": 0.4219948849104859,
1110
+ "eval_runtime": 46.2493,
1111
+ "eval_samples_per_second": 444.115,
1112
+ "eval_steps_per_second": 13.881,
1113
+ "step": 24905
1114
+ },
1115
+ {
1116
+ "epoch": 17.2,
1117
+ "learning_rate": 0.0001478354589545536,
1118
+ "loss": 0.5058,
1119
+ "step": 25198
1120
+ },
1121
+ {
1122
+ "epoch": 17.4,
1123
+ "learning_rate": 0.00013730914316507995,
1124
+ "loss": 0.5182,
1125
+ "step": 25491
1126
+ },
1127
+ {
1128
+ "epoch": 17.6,
1129
+ "learning_rate": 0.00012678282737560627,
1130
+ "loss": 0.5132,
1131
+ "step": 25784
1132
+ },
1133
+ {
1134
+ "epoch": 17.8,
1135
+ "learning_rate": 0.00011629243757858811,
1136
+ "loss": 0.5169,
1137
+ "step": 26077
1138
+ },
1139
+ {
1140
+ "epoch": 18.0,
1141
+ "learning_rate": 0.00010576612178911443,
1142
+ "loss": 0.5103,
1143
+ "step": 26370
1144
+ },
1145
+ {
1146
+ "epoch": 18.0,
1147
+ "eval_accuracy": 0.7581304771178189,
1148
+ "eval_b_acc": 0.6039152175326364,
1149
+ "eval_f1": 0.6206372407316966,
1150
+ "eval_f1_anger": 0.624553694040099,
1151
+ "eval_f1_disgust": 0.4259259259259259,
1152
+ "eval_f1_fear": 0.6247049567269867,
1153
+ "eval_f1_joy": 0.7396948303347757,
1154
+ "eval_f1_neutral": 0.8471082089552239,
1155
+ "eval_f1_sadness": 0.6643598615916955,
1156
+ "eval_f1_surprise": 0.41811320754716985,
1157
+ "eval_loss": 0.6852018237113953,
1158
+ "eval_micro_f1": 0.758130477117819,
1159
+ "eval_prec": 0.6440153151637059,
1160
+ "eval_prec_anger": 0.6202945990180033,
1161
+ "eval_prec_disgust": 0.47668393782383417,
1162
+ "eval_prec_fear": 0.6751700680272109,
1163
+ "eval_prec_joy": 0.7166813768755517,
1164
+ "eval_prec_neutral": 0.8417686318131257,
1165
+ "eval_prec_sadness": 0.667379679144385,
1166
+ "eval_prec_surprise": 0.5101289134438306,
1167
+ "eval_recall": 0.6039152175326364,
1168
+ "eval_recall_anger": 0.6288716814159292,
1169
+ "eval_recall_disgust": 0.38493723849372385,
1170
+ "eval_recall_fear": 0.5812591508052709,
1171
+ "eval_recall_joy": 0.764235294117647,
1172
+ "eval_recall_neutral": 0.8525159594442359,
1173
+ "eval_recall_sadness": 0.6613672496025437,
1174
+ "eval_recall_surprise": 0.35421994884910485,
1175
+ "eval_runtime": 46.0432,
1176
+ "eval_samples_per_second": 446.103,
1177
+ "eval_steps_per_second": 13.943,
1178
+ "step": 26370
1179
+ },
1180
+ {
1181
+ "epoch": 18.2,
1182
+ "learning_rate": 9.523980599964074e-05,
1183
+ "loss": 0.5041,
1184
+ "step": 26663
1185
+ },
1186
+ {
1187
+ "epoch": 18.4,
1188
+ "learning_rate": 8.471349021016706e-05,
1189
+ "loss": 0.5066,
1190
+ "step": 26956
1191
+ },
1192
+ {
1193
+ "epoch": 18.6,
1194
+ "learning_rate": 7.418717442069338e-05,
1195
+ "loss": 0.5007,
1196
+ "step": 27249
1197
+ },
1198
+ {
1199
+ "epoch": 18.8,
1200
+ "learning_rate": 6.369678462367523e-05,
1201
+ "loss": 0.4965,
1202
+ "step": 27542
1203
+ },
1204
+ {
1205
+ "epoch": 19.0,
1206
+ "learning_rate": 5.3170468834201544e-05,
1207
+ "loss": 0.4972,
1208
+ "step": 27835
1209
+ },
1210
+ {
1211
+ "epoch": 19.0,
1212
+ "eval_accuracy": 0.7535053554040896,
1213
+ "eval_b_acc": 0.6039050483043659,
1214
+ "eval_f1": 0.6162485458896193,
1215
+ "eval_f1_anger": 0.6241059602649006,
1216
+ "eval_f1_disgust": 0.41258741258741255,
1217
+ "eval_f1_fear": 0.6275430359937403,
1218
+ "eval_f1_joy": 0.7361095521382872,
1219
+ "eval_f1_neutral": 0.8437618147448016,
1220
+ "eval_f1_sadness": 0.6601011445302103,
1221
+ "eval_f1_surprise": 0.4095309009679821,
1222
+ "eval_loss": 0.6947867274284363,
1223
+ "eval_micro_f1": 0.7535053554040896,
1224
+ "eval_prec": 0.635037226488908,
1225
+ "eval_prec_anger": 0.5988815455007626,
1226
+ "eval_prec_disgust": 0.46578947368421053,
1227
+ "eval_prec_fear": 0.6739495798319328,
1228
+ "eval_prec_joy": 0.7037990985189955,
1229
+ "eval_prec_neutral": 0.849543205177008,
1230
+ "eval_prec_sadness": 0.6631016042780749,
1231
+ "eval_prec_surprise": 0.49019607843137253,
1232
+ "eval_recall": 0.6039050483043659,
1233
+ "eval_recall_anger": 0.6515486725663717,
1234
+ "eval_recall_disgust": 0.3702928870292887,
1235
+ "eval_recall_fear": 0.5871156661786238,
1236
+ "eval_recall_joy": 0.7715294117647059,
1237
+ "eval_recall_neutral": 0.8380585805482539,
1238
+ "eval_recall_sadness": 0.6571277159512454,
1239
+ "eval_recall_surprise": 0.3516624040920716,
1240
+ "eval_runtime": 46.2834,
1241
+ "eval_samples_per_second": 443.788,
1242
+ "eval_steps_per_second": 13.871,
1243
+ "step": 27835
1244
+ },
1245
+ {
1246
+ "epoch": 19.2,
1247
+ "learning_rate": 4.264415304472786e-05,
1248
+ "loss": 0.4927,
1249
+ "step": 28128
1250
+ },
1251
+ {
1252
+ "epoch": 19.4,
1253
+ "learning_rate": 3.211783725525418e-05,
1254
+ "loss": 0.4867,
1255
+ "step": 28421
1256
+ },
1257
+ {
1258
+ "epoch": 19.6,
1259
+ "learning_rate": 2.1591521465780493e-05,
1260
+ "loss": 0.4917,
1261
+ "step": 28714
1262
+ },
1263
+ {
1264
+ "epoch": 19.8,
1265
+ "learning_rate": 1.1065205676306808e-05,
1266
+ "loss": 0.4916,
1267
+ "step": 29007
1268
+ },
1269
+ {
1270
+ "epoch": 20.0,
1271
+ "learning_rate": 5.388898868331237e-07,
1272
+ "loss": 0.4801,
1273
+ "step": 29300
1274
+ },
1275
+ {
1276
+ "epoch": 20.0,
1277
+ "eval_accuracy": 0.7549172346640701,
1278
+ "eval_b_acc": 0.6105911461962804,
1279
+ "eval_f1": 0.6198802361438264,
1280
+ "eval_f1_anger": 0.6221737946063742,
1281
+ "eval_f1_disgust": 0.42093784078516905,
1282
+ "eval_f1_fear": 0.6232558139534883,
1283
+ "eval_f1_joy": 0.7376322074377345,
1284
+ "eval_f1_neutral": 0.8454656747339674,
1285
+ "eval_f1_sadness": 0.6622481442205725,
1286
+ "eval_f1_surprise": 0.4274481772694782,
1287
+ "eval_loss": 0.6945263743400574,
1288
+ "eval_micro_f1": 0.7549172346640701,
1289
+ "eval_prec": 0.6320068488618952,
1290
+ "eval_prec_anger": 0.6129898013955984,
1291
+ "eval_prec_disgust": 0.4396355353075171,
1292
+ "eval_prec_fear": 0.6622734761120264,
1293
+ "eval_prec_joy": 0.713845476557341,
1294
+ "eval_prec_neutral": 0.8481012658227848,
1295
+ "eval_prec_sadness": 0.6625994694960212,
1296
+ "eval_prec_surprise": 0.4846029173419773,
1297
+ "eval_recall": 0.6105911461962804,
1298
+ "eval_recall_anger": 0.6316371681415929,
1299
+ "eval_recall_disgust": 0.40376569037656906,
1300
+ "eval_recall_fear": 0.5885797950219619,
1301
+ "eval_recall_joy": 0.7630588235294118,
1302
+ "eval_recall_neutral": 0.8428464138190012,
1303
+ "eval_recall_sadness": 0.661897191308956,
1304
+ "eval_recall_surprise": 0.38235294117647056,
1305
+ "eval_runtime": 46.1785,
1306
+ "eval_samples_per_second": 444.796,
1307
+ "eval_steps_per_second": 13.903,
1308
+ "step": 29300
1309
+ },
1310
+ {
1311
+ "epoch": 20.0,
1312
+ "step": 29300,
1313
+ "total_flos": 8.789779081685053e+17,
1314
+ "train_loss": 0.6315777759747294,
1315
+ "train_runtime": 20512.0097,
1316
+ "train_samples_per_second": 182.843,
1317
+ "train_steps_per_second": 1.428
1318
  }
1319
  ],
1320
+ "max_steps": 29300,
1321
+ "num_train_epochs": 20,
1322
+ "total_flos": 8.789779081685053e+17,
1323
  "trial_name": null,
1324
  "trial_params": null
1325
  }