anniew666 commited on
Commit
447a2b2
1 Parent(s): f598d00

End of training

Browse files
Files changed (7) hide show
  1. all_results.json +40 -0
  2. cf.png +2 -2
  3. cf.txt +7 -7
  4. class_report.txt +8 -8
  5. eval_results.json +35 -0
  6. train_results.json +8 -0
  7. trainer_state.json +1284 -0
all_results.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 0.7630963972736124,
4
+ "eval_b_acc": 0.6053830892588602,
5
+ "eval_f1": 0.6276991641576467,
6
+ "eval_f1_anger": 0.6168702073274639,
7
+ "eval_f1_disgust": 0.43303571428571425,
8
+ "eval_f1_fear": 0.638801261829653,
9
+ "eval_f1_joy": 0.7379285799027169,
10
+ "eval_f1_neutral": 0.8519039622384605,
11
+ "eval_f1_sadness": 0.6683630195080577,
12
+ "eval_f1_surprise": 0.44699140401146126,
13
+ "eval_loss": 0.6577332019805908,
14
+ "eval_micro_f1": 0.7630963972736124,
15
+ "eval_prec": 0.6548174460459298,
16
+ "eval_prec_anger": 0.6339754816112084,
17
+ "eval_prec_disgust": 0.46411483253588515,
18
+ "eval_prec_fear": 0.6923076923076923,
19
+ "eval_prec_joy": 0.7441971763579803,
20
+ "eval_prec_neutral": 0.8246199806695369,
21
+ "eval_prec_sadness": 0.7163636363636363,
22
+ "eval_prec_surprise": 0.50814332247557,
23
+ "eval_recall": 0.6053830892588602,
24
+ "eval_recall_anger": 0.6006637168141593,
25
+ "eval_recall_disgust": 0.40585774058577406,
26
+ "eval_recall_fear": 0.5929721815519766,
27
+ "eval_recall_joy": 0.731764705882353,
28
+ "eval_recall_neutral": 0.8810552009012392,
29
+ "eval_recall_sadness": 0.6263910969793323,
30
+ "eval_recall_surprise": 0.3989769820971867,
31
+ "eval_runtime": 52.7414,
32
+ "eval_samples": 20540,
33
+ "eval_samples_per_second": 389.447,
34
+ "eval_steps_per_second": 24.345,
35
+ "train_loss": 0.6400373776102771,
36
+ "train_runtime": 15988.8097,
37
+ "train_samples": 187524,
38
+ "train_samples_per_second": 175.927,
39
+ "train_steps_per_second": 1.374
40
+ }
cf.png CHANGED

Git LFS Details

  • SHA256: 163a2a43bc9a31f6f7787197cf40dbd1bfec84e35902d600ea6c7512828ba156
  • Pointer size: 130 Bytes
  • Size of remote file: 57.4 kB

Git LFS Details

  • SHA256: d7535020cf3ac357cdecbab2dbe9eab87ea70795ba87e480c1886703a2c3f0ad
  • Pointer size: 130 Bytes
  • Size of remote file: 57.4 kB
cf.txt CHANGED
@@ -1,7 +1,7 @@
1
- 6.050884955752212635e-01 4.424778761061946841e-02 2.876106194690265447e-02 5.641592920353982049e-02 1.852876106194690231e-01 5.696902654867256471e-02 2.323008849557522265e-02
2
- 1.966527196652719800e-01 4.163179916317991669e-01 4.811715481171548181e-02 5.648535564853556651e-02 7.949790794979079422e-02 1.799163179916317967e-01 2.301255230125523119e-02
3
- 6.295754026354319355e-02 2.489019033674963466e-02 5.988286969253294734e-01 6.442166910688140735e-02 1.390922401171303113e-01 5.710102489019033833e-02 5.270863836017569692e-02
4
- 2.023529411764705965e-02 3.764705882352941280e-03 7.294117647058823324e-03 7.804705882352941382e-01 1.491764705882352993e-01 2.541176470588235245e-02 1.364705882352941144e-02
5
- 2.750657153586181028e-02 4.036800600826136350e-03 4.787833270747277915e-03 8.796470146451371153e-02 8.388096132181750431e-01 2.459631993991738541e-02 1.229815996995869271e-02
6
- 4.557498675145733869e-02 2.596714361420243700e-02 2.437731849496555317e-02 6.465288818229994461e-02 1.505034446210916921e-01 6.756756756756756577e-01 1.324854266030736638e-02
7
- 5.498721227621483632e-02 1.023017902813299317e-02 2.685421994884910554e-02 1.982097186700767233e-01 2.340153452685422020e-01 7.033248081841432520e-02 4.053708439897698024e-01
 
1
+ 6.006637168141593097e-01 3.705752212389380740e-02 2.488938053097345185e-02 5.088495575221239214e-02 2.212389380530973559e-01 3.871681415929203313e-02 2.654867256637168105e-02
2
+ 2.175732217573221883e-01 4.058577405857740628e-01 5.020920502092050125e-02 6.485355648535565121e-02 1.066945606694560678e-01 1.297071129707113024e-01 2.510460251046025063e-02
3
+ 6.588579795021962116e-02 2.196193265007320705e-02 5.929721815519766182e-01 5.270863836017569692e-02 1.625183016105417322e-01 4.538799414348462791e-02 5.856515373352855214e-02
4
+ 1.882352941176470423e-02 4.235294117647058453e-03 5.176470588235294532e-03 7.317647058823529838e-01 2.021176470588235408e-01 2.094117647058823389e-02 1.694117647058823381e-02
5
+ 2.412692452121667150e-02 4.787833270747277915e-03 2.722493428464138176e-03 6.111528351483289795e-02 8.810552009012392327e-01 1.624108148704468679e-02 9.951182876455126614e-03
6
+ 5.352411234764176129e-02 3.179650238473767654e-02 2.066772655007948975e-02 6.200317965023847272e-02 1.928987811340752423e-01 6.263910969793322625e-01 1.271860095389507235e-02
7
+ 5.115089514066496063e-02 1.662404092071611411e-02 2.685421994884910554e-02 1.815856777493606022e-01 2.698209718670076529e-01 5.498721227621483632e-02 3.989769820971866832e-01
class_report.txt CHANGED
@@ -1,13 +1,13 @@
1
  precision recall f1-score support
2
 
3
- 0anger 0.63 0.61 0.62 1808
4
- 1disgust 0.48 0.42 0.45 478
5
- 2fear 0.65 0.60 0.62 683
6
- 3joy 0.71 0.78 0.74 4250
7
- 4neutral 0.85 0.84 0.84 10652
8
- 5sadness 0.66 0.68 0.67 1887
9
- 6surprise 0.51 0.41 0.45 782
10
 
11
  accuracy 0.76 20540
12
- macro avg 0.64 0.62 0.63 20540
13
  weighted avg 0.76 0.76 0.76 20540
 
1
  precision recall f1-score support
2
 
3
+ 0anger 0.63 0.60 0.62 1808
4
+ 1disgust 0.46 0.41 0.43 478
5
+ 2fear 0.69 0.59 0.64 683
6
+ 3joy 0.74 0.73 0.74 4250
7
+ 4neutral 0.82 0.88 0.85 10652
8
+ 5sadness 0.72 0.63 0.67 1887
9
+ 6surprise 0.51 0.40 0.45 782
10
 
11
  accuracy 0.76 20540
12
+ macro avg 0.65 0.61 0.63 20540
13
  weighted avg 0.76 0.76 0.76 20540
eval_results.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 0.7630963972736124,
4
+ "eval_b_acc": 0.6053830892588602,
5
+ "eval_f1": 0.6276991641576467,
6
+ "eval_f1_anger": 0.6168702073274639,
7
+ "eval_f1_disgust": 0.43303571428571425,
8
+ "eval_f1_fear": 0.638801261829653,
9
+ "eval_f1_joy": 0.7379285799027169,
10
+ "eval_f1_neutral": 0.8519039622384605,
11
+ "eval_f1_sadness": 0.6683630195080577,
12
+ "eval_f1_surprise": 0.44699140401146126,
13
+ "eval_loss": 0.6577332019805908,
14
+ "eval_micro_f1": 0.7630963972736124,
15
+ "eval_prec": 0.6548174460459298,
16
+ "eval_prec_anger": 0.6339754816112084,
17
+ "eval_prec_disgust": 0.46411483253588515,
18
+ "eval_prec_fear": 0.6923076923076923,
19
+ "eval_prec_joy": 0.7441971763579803,
20
+ "eval_prec_neutral": 0.8246199806695369,
21
+ "eval_prec_sadness": 0.7163636363636363,
22
+ "eval_prec_surprise": 0.50814332247557,
23
+ "eval_recall": 0.6053830892588602,
24
+ "eval_recall_anger": 0.6006637168141593,
25
+ "eval_recall_disgust": 0.40585774058577406,
26
+ "eval_recall_fear": 0.5929721815519766,
27
+ "eval_recall_joy": 0.731764705882353,
28
+ "eval_recall_neutral": 0.8810552009012392,
29
+ "eval_recall_sadness": 0.6263910969793323,
30
+ "eval_recall_surprise": 0.3989769820971867,
31
+ "eval_runtime": 52.7414,
32
+ "eval_samples": 20540,
33
+ "eval_samples_per_second": 389.447,
34
+ "eval_steps_per_second": 24.345
35
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "train_loss": 0.6400373776102771,
4
+ "train_runtime": 15988.8097,
5
+ "train_samples": 187524,
6
+ "train_samples_per_second": 175.927,
7
+ "train_steps_per_second": 1.374
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,1284 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.6276991641576467,
3
+ "best_model_checkpoint": ".exp/lora/lora-roberta-large-no-ed/checkpoint-17584",
4
+ "epoch": 14.99744070977649,
5
+ "global_step": 21975,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.15,
12
+ "learning_rate": 0.00019836214740673338,
13
+ "loss": 1.2151,
14
+ "step": 220
15
+ },
16
+ {
17
+ "epoch": 0.3,
18
+ "learning_rate": 0.0003976342129208371,
19
+ "loss": 0.8737,
20
+ "step": 440
21
+ },
22
+ {
23
+ "epoch": 0.45,
24
+ "learning_rate": 0.0005969062784349408,
25
+ "loss": 0.8228,
26
+ "step": 660
27
+ },
28
+ {
29
+ "epoch": 0.6,
30
+ "learning_rate": 0.0007970882620564149,
31
+ "loss": 0.8081,
32
+ "step": 880
33
+ },
34
+ {
35
+ "epoch": 0.75,
36
+ "eval_accuracy": 0.7138266796494644,
37
+ "eval_b_acc": 0.5642215512771782,
38
+ "eval_f1": 0.5601190771157161,
39
+ "eval_f1_anger": 0.515716568993074,
40
+ "eval_f1_disgust": 0.3879907621247113,
41
+ "eval_f1_fear": 0.5360230547550433,
42
+ "eval_f1_joy": 0.6877726536208402,
43
+ "eval_f1_neutral": 0.8344834105302958,
44
+ "eval_f1_sadness": 0.5870011402508551,
45
+ "eval_f1_surprise": 0.3718459495351925,
46
+ "eval_loss": 0.790067732334137,
47
+ "eval_micro_f1": 0.7138266796494644,
48
+ "eval_prec": 0.5616517829432821,
49
+ "eval_prec_anger": 0.49743062692702983,
50
+ "eval_prec_disgust": 0.4329896907216495,
51
+ "eval_prec_fear": 0.5276595744680851,
52
+ "eval_prec_joy": 0.7312483434932414,
53
+ "eval_prec_neutral": 0.8402817437654674,
54
+ "eval_prec_sadness": 0.5152121697357886,
55
+ "eval_prec_surprise": 0.3867403314917127,
56
+ "eval_recall": 0.5642215512771782,
57
+ "eval_recall_anger": 0.5353982300884956,
58
+ "eval_recall_disgust": 0.3514644351464435,
59
+ "eval_recall_fear": 0.5446559297218155,
60
+ "eval_recall_joy": 0.6491764705882352,
61
+ "eval_recall_neutral": 0.8287645512579798,
62
+ "eval_recall_sadness": 0.6820349761526232,
63
+ "eval_recall_surprise": 0.35805626598465473,
64
+ "eval_runtime": 53.9044,
65
+ "eval_samples_per_second": 381.045,
66
+ "eval_steps_per_second": 23.82,
67
+ "step": 1099
68
+ },
69
+ {
70
+ "epoch": 0.75,
71
+ "learning_rate": 0.000997270245677889,
72
+ "loss": 0.7828,
73
+ "step": 1100
74
+ },
75
+ {
76
+ "epoch": 0.9,
77
+ "learning_rate": 0.0009896052883694194,
78
+ "loss": 0.7661,
79
+ "step": 1320
80
+ },
81
+ {
82
+ "epoch": 1.05,
83
+ "learning_rate": 0.0009790668710480935,
84
+ "loss": 0.7799,
85
+ "step": 1540
86
+ },
87
+ {
88
+ "epoch": 1.2,
89
+ "learning_rate": 0.0009685284537267676,
90
+ "loss": 0.757,
91
+ "step": 1760
92
+ },
93
+ {
94
+ "epoch": 1.35,
95
+ "learning_rate": 0.0009579900364054417,
96
+ "loss": 0.7543,
97
+ "step": 1980
98
+ },
99
+ {
100
+ "epoch": 1.5,
101
+ "eval_accuracy": 0.7262901655306718,
102
+ "eval_b_acc": 0.5714411859458394,
103
+ "eval_f1": 0.573711944542916,
104
+ "eval_f1_anger": 0.5241837968561063,
105
+ "eval_f1_disgust": 0.44267198404785646,
106
+ "eval_f1_fear": 0.546070460704607,
107
+ "eval_f1_joy": 0.7150729335494327,
108
+ "eval_f1_neutral": 0.8296947358472735,
109
+ "eval_f1_sadness": 0.6172300981461288,
110
+ "eval_f1_surprise": 0.3410596026490066,
111
+ "eval_loss": 0.7482287883758545,
112
+ "eval_micro_f1": 0.7262901655306718,
113
+ "eval_prec": 0.5892369276637266,
114
+ "eval_prec_anger": 0.578,
115
+ "eval_prec_disgust": 0.4228571428571429,
116
+ "eval_prec_fear": 0.5081967213114754,
117
+ "eval_prec_joy": 0.6611388611388611,
118
+ "eval_prec_neutral": 0.8352997145575642,
119
+ "eval_prec_sadness": 0.6355979786636721,
120
+ "eval_prec_surprise": 0.4835680751173709,
121
+ "eval_recall": 0.5714411859458394,
122
+ "eval_recall_anger": 0.4795353982300885,
123
+ "eval_recall_disgust": 0.46443514644351463,
124
+ "eval_recall_fear": 0.5900439238653001,
125
+ "eval_recall_joy": 0.7785882352941177,
126
+ "eval_recall_neutral": 0.8241644761547128,
127
+ "eval_recall_sadness": 0.5998940116587176,
128
+ "eval_recall_surprise": 0.26342710997442453,
129
+ "eval_runtime": 52.5664,
130
+ "eval_samples_per_second": 390.744,
131
+ "eval_steps_per_second": 24.426,
132
+ "step": 2198
133
+ },
134
+ {
135
+ "epoch": 1.5,
136
+ "learning_rate": 0.0009474516190841157,
137
+ "loss": 0.7562,
138
+ "step": 2200
139
+ },
140
+ {
141
+ "epoch": 1.65,
142
+ "learning_rate": 0.0009369132017627898,
143
+ "loss": 0.7601,
144
+ "step": 2420
145
+ },
146
+ {
147
+ "epoch": 1.8,
148
+ "learning_rate": 0.0009263747844414639,
149
+ "loss": 0.7501,
150
+ "step": 2640
151
+ },
152
+ {
153
+ "epoch": 1.95,
154
+ "learning_rate": 0.000915836367120138,
155
+ "loss": 0.737,
156
+ "step": 2860
157
+ },
158
+ {
159
+ "epoch": 2.1,
160
+ "learning_rate": 0.0009052979497988121,
161
+ "loss": 0.7292,
162
+ "step": 3080
163
+ },
164
+ {
165
+ "epoch": 2.25,
166
+ "eval_accuracy": 0.739240506329114,
167
+ "eval_b_acc": 0.5728734605953718,
168
+ "eval_f1": 0.5834227565376339,
169
+ "eval_f1_anger": 0.5439560439560439,
170
+ "eval_f1_disgust": 0.41185185185185186,
171
+ "eval_f1_fear": 0.593798449612403,
172
+ "eval_f1_joy": 0.721927599723311,
173
+ "eval_f1_neutral": 0.8387907060195567,
174
+ "eval_f1_sadness": 0.6231551328304362,
175
+ "eval_f1_surprise": 0.35047951176983433,
176
+ "eval_loss": 0.7176372408866882,
177
+ "eval_micro_f1": 0.739240506329114,
178
+ "eval_prec": 0.633689371773426,
179
+ "eval_prec_anger": 0.6069482288828338,
180
+ "eval_prec_disgust": 0.31880733944954126,
181
+ "eval_prec_fear": 0.6309719934102141,
182
+ "eval_prec_joy": 0.7077305605786618,
183
+ "eval_prec_neutral": 0.8031266105480158,
184
+ "eval_prec_sadness": 0.8175559380378657,
185
+ "eval_prec_surprise": 0.5506849315068493,
186
+ "eval_recall": 0.5728734605953718,
187
+ "eval_recall_anger": 0.4928097345132743,
188
+ "eval_recall_disgust": 0.5815899581589958,
189
+ "eval_recall_fear": 0.5607613469985359,
190
+ "eval_recall_joy": 0.7367058823529412,
191
+ "eval_recall_neutral": 0.8777694329703342,
192
+ "eval_recall_sadness": 0.5034446210916799,
193
+ "eval_recall_surprise": 0.2570332480818414,
194
+ "eval_runtime": 52.5539,
195
+ "eval_samples_per_second": 390.837,
196
+ "eval_steps_per_second": 24.432,
197
+ "step": 3297
198
+ },
199
+ {
200
+ "epoch": 2.25,
201
+ "learning_rate": 0.0008948074343744013,
202
+ "loss": 0.7375,
203
+ "step": 3300
204
+ },
205
+ {
206
+ "epoch": 2.4,
207
+ "learning_rate": 0.0008842690170530752,
208
+ "loss": 0.7199,
209
+ "step": 3520
210
+ },
211
+ {
212
+ "epoch": 2.55,
213
+ "learning_rate": 0.0008737305997317494,
214
+ "loss": 0.7064,
215
+ "step": 3740
216
+ },
217
+ {
218
+ "epoch": 2.7,
219
+ "learning_rate": 0.0008631921824104235,
220
+ "loss": 0.7063,
221
+ "step": 3960
222
+ },
223
+ {
224
+ "epoch": 2.85,
225
+ "learning_rate": 0.0008526537650890975,
226
+ "loss": 0.7138,
227
+ "step": 4180
228
+ },
229
+ {
230
+ "epoch": 3.0,
231
+ "eval_accuracy": 0.7448393378773126,
232
+ "eval_b_acc": 0.5918170569783451,
233
+ "eval_f1": 0.6005073740718484,
234
+ "eval_f1_anger": 0.583310230108123,
235
+ "eval_f1_disgust": 0.4129301355578728,
236
+ "eval_f1_fear": 0.582723279648609,
237
+ "eval_f1_joy": 0.729650507328072,
238
+ "eval_f1_neutral": 0.8403856955626287,
239
+ "eval_f1_sadness": 0.6514983351831298,
240
+ "eval_f1_surprise": 0.40305343511450376,
241
+ "eval_loss": 0.688290536403656,
242
+ "eval_micro_f1": 0.7448393378773126,
243
+ "eval_prec": 0.6144786785060393,
244
+ "eval_prec_anger": 0.584769316286826,
245
+ "eval_prec_disgust": 0.41164241164241167,
246
+ "eval_prec_fear": 0.582723279648609,
247
+ "eval_prec_joy": 0.7004329004329004,
248
+ "eval_prec_neutral": 0.8380321135175504,
249
+ "eval_prec_sadness": 0.6837507280139778,
250
+ "eval_prec_surprise": 0.5,
251
+ "eval_recall": 0.5918170569783451,
252
+ "eval_recall_anger": 0.581858407079646,
253
+ "eval_recall_disgust": 0.41422594142259417,
254
+ "eval_recall_fear": 0.582723279648609,
255
+ "eval_recall_joy": 0.7614117647058823,
256
+ "eval_recall_neutral": 0.842752534735261,
257
+ "eval_recall_sadness": 0.6221515633280339,
258
+ "eval_recall_surprise": 0.3375959079283887,
259
+ "eval_runtime": 52.617,
260
+ "eval_samples_per_second": 390.368,
261
+ "eval_steps_per_second": 24.403,
262
+ "step": 4396
263
+ },
264
+ {
265
+ "epoch": 3.0,
266
+ "learning_rate": 0.0008421632496646868,
267
+ "loss": 0.7289,
268
+ "step": 4400
269
+ },
270
+ {
271
+ "epoch": 3.15,
272
+ "learning_rate": 0.0008316248323433608,
273
+ "loss": 0.6887,
274
+ "step": 4620
275
+ },
276
+ {
277
+ "epoch": 3.3,
278
+ "learning_rate": 0.0008210864150220348,
279
+ "loss": 0.6982,
280
+ "step": 4840
281
+ },
282
+ {
283
+ "epoch": 3.45,
284
+ "learning_rate": 0.0008105479977007089,
285
+ "loss": 0.701,
286
+ "step": 5060
287
+ },
288
+ {
289
+ "epoch": 3.6,
290
+ "learning_rate": 0.0008000095803793831,
291
+ "loss": 0.7046,
292
+ "step": 5280
293
+ },
294
+ {
295
+ "epoch": 3.75,
296
+ "eval_accuracy": 0.7464946445959104,
297
+ "eval_b_acc": 0.5788756560881936,
298
+ "eval_f1": 0.5986191545663104,
299
+ "eval_f1_anger": 0.5739130434782608,
300
+ "eval_f1_disgust": 0.3984476067270375,
301
+ "eval_f1_fear": 0.5746569814366425,
302
+ "eval_f1_joy": 0.730888607885964,
303
+ "eval_f1_neutral": 0.8425003475279181,
304
+ "eval_f1_sadness": 0.6517333333333334,
305
+ "eval_f1_surprise": 0.418194161575017,
306
+ "eval_loss": 0.682627260684967,
307
+ "eval_micro_f1": 0.7464946445959104,
308
+ "eval_prec": 0.6275132039697725,
309
+ "eval_prec_anger": 0.5822424587364826,
310
+ "eval_prec_disgust": 0.5220338983050847,
311
+ "eval_prec_fear": 0.6402877697841727,
312
+ "eval_prec_joy": 0.7145425938413127,
313
+ "eval_prec_neutral": 0.8318235886174399,
314
+ "eval_prec_sadness": 0.6559312936124531,
315
+ "eval_prec_surprise": 0.44573082489146165,
316
+ "eval_recall": 0.5788756560881936,
317
+ "eval_recall_anger": 0.5658185840707964,
318
+ "eval_recall_disgust": 0.32217573221757323,
319
+ "eval_recall_fear": 0.5212298682284041,
320
+ "eval_recall_joy": 0.748,
321
+ "eval_recall_neutral": 0.8534547502816372,
322
+ "eval_recall_sadness": 0.6475887652358241,
323
+ "eval_recall_surprise": 0.3938618925831202,
324
+ "eval_runtime": 54.8263,
325
+ "eval_samples_per_second": 374.638,
326
+ "eval_steps_per_second": 23.419,
327
+ "step": 5495
328
+ },
329
+ {
330
+ "epoch": 3.75,
331
+ "learning_rate": 0.0007894711630580571,
332
+ "loss": 0.7145,
333
+ "step": 5500
334
+ },
335
+ {
336
+ "epoch": 3.9,
337
+ "learning_rate": 0.0007789806476336463,
338
+ "loss": 0.7056,
339
+ "step": 5720
340
+ },
341
+ {
342
+ "epoch": 4.05,
343
+ "learning_rate": 0.0007684422303123204,
344
+ "loss": 0.6911,
345
+ "step": 5940
346
+ },
347
+ {
348
+ "epoch": 4.2,
349
+ "learning_rate": 0.0007579038129909944,
350
+ "loss": 0.6777,
351
+ "step": 6160
352
+ },
353
+ {
354
+ "epoch": 4.35,
355
+ "learning_rate": 0.0007473653956696685,
356
+ "loss": 0.6767,
357
+ "step": 6380
358
+ },
359
+ {
360
+ "epoch": 4.5,
361
+ "eval_accuracy": 0.7435735150925025,
362
+ "eval_b_acc": 0.5648744699236212,
363
+ "eval_f1": 0.592256565822076,
364
+ "eval_f1_anger": 0.5643717196665637,
365
+ "eval_f1_disgust": 0.36467236467236464,
366
+ "eval_f1_fear": 0.6036536934074663,
367
+ "eval_f1_joy": 0.7215847324556106,
368
+ "eval_f1_neutral": 0.8374881666140739,
369
+ "eval_f1_sadness": 0.6377816291161179,
370
+ "eval_f1_surprise": 0.416243654822335,
371
+ "eval_loss": 0.6971003413200378,
372
+ "eval_micro_f1": 0.7435735150925025,
373
+ "eval_prec": 0.6422939486456166,
374
+ "eval_prec_anger": 0.6387141858839972,
375
+ "eval_prec_disgust": 0.5714285714285714,
376
+ "eval_prec_fear": 0.6597222222222222,
377
+ "eval_prec_joy": 0.7413750310250683,
378
+ "eval_prec_neutral": 0.80556760038158,
379
+ "eval_prec_sadness": 0.5985130111524164,
380
+ "eval_prec_surprise": 0.4807370184254606,
381
+ "eval_recall": 0.5648744699236212,
382
+ "eval_recall_anger": 0.5055309734513275,
383
+ "eval_recall_disgust": 0.26778242677824265,
384
+ "eval_recall_fear": 0.5563689604685212,
385
+ "eval_recall_joy": 0.7028235294117647,
386
+ "eval_recall_neutral": 0.8720428088621855,
387
+ "eval_recall_sadness": 0.6825649178590355,
388
+ "eval_recall_surprise": 0.3670076726342711,
389
+ "eval_runtime": 52.3013,
390
+ "eval_samples_per_second": 392.725,
391
+ "eval_steps_per_second": 24.55,
392
+ "step": 6594
393
+ },
394
+ {
395
+ "epoch": 4.5,
396
+ "learning_rate": 0.0007368269783483425,
397
+ "loss": 0.6834,
398
+ "step": 6600
399
+ },
400
+ {
401
+ "epoch": 4.65,
402
+ "learning_rate": 0.0007262885610270167,
403
+ "loss": 0.6924,
404
+ "step": 6820
405
+ },
406
+ {
407
+ "epoch": 4.8,
408
+ "learning_rate": 0.0007157501437056908,
409
+ "loss": 0.6872,
410
+ "step": 7040
411
+ },
412
+ {
413
+ "epoch": 4.95,
414
+ "learning_rate": 0.0007052117263843648,
415
+ "loss": 0.6681,
416
+ "step": 7260
417
+ },
418
+ {
419
+ "epoch": 5.1,
420
+ "learning_rate": 0.000694673309063039,
421
+ "loss": 0.661,
422
+ "step": 7480
423
+ },
424
+ {
425
+ "epoch": 5.25,
426
+ "eval_accuracy": 0.7383641674780915,
427
+ "eval_b_acc": 0.602771097930762,
428
+ "eval_f1": 0.6030709415406346,
429
+ "eval_f1_anger": 0.5770609318996416,
430
+ "eval_f1_disgust": 0.41814595660749504,
431
+ "eval_f1_fear": 0.6160198183319571,
432
+ "eval_f1_joy": 0.7286771805600258,
433
+ "eval_f1_neutral": 0.8364084854464726,
434
+ "eval_f1_sadness": 0.6574813998346651,
435
+ "eval_f1_surprise": 0.38770281810418444,
436
+ "eval_loss": 0.7123843431472778,
437
+ "eval_micro_f1": 0.7383641674780915,
438
+ "eval_prec": 0.6294789669741513,
439
+ "eval_prec_anger": 0.48493975903614456,
440
+ "eval_prec_disgust": 0.39552238805970147,
441
+ "eval_prec_fear": 0.7064393939393939,
442
+ "eval_prec_joy": 0.6696903963715244,
443
+ "eval_prec_neutral": 0.88136826783115,
444
+ "eval_prec_sadness": 0.6848450057405281,
445
+ "eval_prec_surprise": 0.583547557840617,
446
+ "eval_recall": 0.602771097930762,
447
+ "eval_recall_anger": 0.7123893805309734,
448
+ "eval_recall_disgust": 0.4435146443514644,
449
+ "eval_recall_fear": 0.5461200585651538,
450
+ "eval_recall_joy": 0.7990588235294117,
451
+ "eval_recall_neutral": 0.7958129928651896,
452
+ "eval_recall_sadness": 0.6322204557498675,
453
+ "eval_recall_surprise": 0.29028132992327366,
454
+ "eval_runtime": 52.258,
455
+ "eval_samples_per_second": 393.05,
456
+ "eval_steps_per_second": 24.57,
457
+ "step": 7693
458
+ },
459
+ {
460
+ "epoch": 5.26,
461
+ "learning_rate": 0.000684134891741713,
462
+ "loss": 0.6623,
463
+ "step": 7700
464
+ },
465
+ {
466
+ "epoch": 5.41,
467
+ "learning_rate": 0.000673596474420387,
468
+ "loss": 0.6663,
469
+ "step": 7920
470
+ },
471
+ {
472
+ "epoch": 5.56,
473
+ "learning_rate": 0.0006630580570990611,
474
+ "loss": 0.6669,
475
+ "step": 8140
476
+ },
477
+ {
478
+ "epoch": 5.71,
479
+ "learning_rate": 0.0006525196397777352,
480
+ "loss": 0.6691,
481
+ "step": 8360
482
+ },
483
+ {
484
+ "epoch": 5.86,
485
+ "learning_rate": 0.0006419812224564093,
486
+ "loss": 0.6652,
487
+ "step": 8580
488
+ },
489
+ {
490
+ "epoch": 6.0,
491
+ "eval_accuracy": 0.752921129503408,
492
+ "eval_b_acc": 0.594191766213012,
493
+ "eval_f1": 0.6135563471911549,
494
+ "eval_f1_anger": 0.5377977217811529,
495
+ "eval_f1_disgust": 0.4477933261571583,
496
+ "eval_f1_fear": 0.6142208774583964,
497
+ "eval_f1_joy": 0.7345635202271116,
498
+ "eval_f1_neutral": 0.8443846671149968,
499
+ "eval_f1_sadness": 0.659697386519945,
500
+ "eval_f1_surprise": 0.4564369310793238,
501
+ "eval_loss": 0.670600414276123,
502
+ "eval_micro_f1": 0.752921129503408,
503
+ "eval_prec": 0.6441161632494222,
504
+ "eval_prec_anger": 0.7153351698806244,
505
+ "eval_prec_disgust": 0.4611973392461197,
506
+ "eval_prec_fear": 0.6353677621283255,
507
+ "eval_prec_joy": 0.7385823025689819,
508
+ "eval_prec_neutral": 0.8081180811808119,
509
+ "eval_prec_sadness": 0.6859267734553776,
510
+ "eval_prec_surprise": 0.4642857142857143,
511
+ "eval_recall": 0.594191766213012,
512
+ "eval_recall_anger": 0.43086283185840707,
513
+ "eval_recall_disgust": 0.4351464435146444,
514
+ "eval_recall_fear": 0.5944363103953147,
515
+ "eval_recall_joy": 0.7305882352941176,
516
+ "eval_recall_neutral": 0.8840593315809238,
517
+ "eval_recall_sadness": 0.6354001059883413,
518
+ "eval_recall_surprise": 0.44884910485933505,
519
+ "eval_runtime": 52.6277,
520
+ "eval_samples_per_second": 390.289,
521
+ "eval_steps_per_second": 24.398,
522
+ "step": 8792
523
+ },
524
+ {
525
+ "epoch": 6.01,
526
+ "learning_rate": 0.0006314428051350833,
527
+ "loss": 0.66,
528
+ "step": 8800
529
+ },
530
+ {
531
+ "epoch": 6.16,
532
+ "learning_rate": 0.0006209043878137575,
533
+ "loss": 0.6414,
534
+ "step": 9020
535
+ },
536
+ {
537
+ "epoch": 6.31,
538
+ "learning_rate": 0.0006103659704924315,
539
+ "loss": 0.6445,
540
+ "step": 9240
541
+ },
542
+ {
543
+ "epoch": 6.46,
544
+ "learning_rate": 0.0005998275531711056,
545
+ "loss": 0.6405,
546
+ "step": 9460
547
+ },
548
+ {
549
+ "epoch": 6.61,
550
+ "learning_rate": 0.0005892891358497796,
551
+ "loss": 0.6532,
552
+ "step": 9680
553
+ },
554
+ {
555
+ "epoch": 6.75,
556
+ "eval_accuracy": 0.7581791626095423,
557
+ "eval_b_acc": 0.5852602000181494,
558
+ "eval_f1": 0.614564401804941,
559
+ "eval_f1_anger": 0.5887445887445888,
560
+ "eval_f1_disgust": 0.4246079613992763,
561
+ "eval_f1_fear": 0.6189300411522632,
562
+ "eval_f1_joy": 0.7366662689416538,
563
+ "eval_f1_neutral": 0.8483534354248544,
564
+ "eval_f1_sadness": 0.6636794939377966,
565
+ "eval_f1_surprise": 0.42096902303415407,
566
+ "eval_loss": 0.6566693782806396,
567
+ "eval_micro_f1": 0.7581791626095423,
568
+ "eval_prec": 0.6577687706916829,
569
+ "eval_prec_anger": 0.6155703077851539,
570
+ "eval_prec_disgust": 0.5014245014245015,
571
+ "eval_prec_fear": 0.706766917293233,
572
+ "eval_prec_joy": 0.7472766884531591,
573
+ "eval_prec_neutral": 0.8175881584675664,
574
+ "eval_prec_sadness": 0.6601992658626115,
575
+ "eval_prec_surprise": 0.5555555555555556,
576
+ "eval_recall": 0.5852602000181494,
577
+ "eval_recall_anger": 0.5641592920353983,
578
+ "eval_recall_disgust": 0.3682008368200837,
579
+ "eval_recall_fear": 0.5505124450951684,
580
+ "eval_recall_joy": 0.7263529411764705,
581
+ "eval_recall_neutral": 0.88152459631994,
582
+ "eval_recall_sadness": 0.6671966083730789,
583
+ "eval_recall_surprise": 0.3388746803069054,
584
+ "eval_runtime": 52.2302,
585
+ "eval_samples_per_second": 393.259,
586
+ "eval_steps_per_second": 24.583,
587
+ "step": 9891
588
+ },
589
+ {
590
+ "epoch": 6.76,
591
+ "learning_rate": 0.0005787507185284537,
592
+ "loss": 0.6566,
593
+ "step": 9900
594
+ },
595
+ {
596
+ "epoch": 6.91,
597
+ "learning_rate": 0.0005682602031040429,
598
+ "loss": 0.6528,
599
+ "step": 10120
600
+ },
601
+ {
602
+ "epoch": 7.06,
603
+ "learning_rate": 0.000557769687679632,
604
+ "loss": 0.6419,
605
+ "step": 10340
606
+ },
607
+ {
608
+ "epoch": 7.21,
609
+ "learning_rate": 0.0005472312703583062,
610
+ "loss": 0.6305,
611
+ "step": 10560
612
+ },
613
+ {
614
+ "epoch": 7.36,
615
+ "learning_rate": 0.0005366928530369802,
616
+ "loss": 0.6314,
617
+ "step": 10780
618
+ },
619
+ {
620
+ "epoch": 7.5,
621
+ "eval_accuracy": 0.7554527750730282,
622
+ "eval_b_acc": 0.5864396115457234,
623
+ "eval_f1": 0.6141846408191719,
624
+ "eval_f1_anger": 0.6100183582480986,
625
+ "eval_f1_disgust": 0.4005235602094241,
626
+ "eval_f1_fear": 0.6080586080586081,
627
+ "eval_f1_joy": 0.7392614080107107,
628
+ "eval_f1_neutral": 0.8438656485688855,
629
+ "eval_f1_sadness": 0.6687747035573123,
630
+ "eval_f1_surprise": 0.4287901990811639,
631
+ "eval_loss": 0.6726419925689697,
632
+ "eval_micro_f1": 0.7554527750730282,
633
+ "eval_prec": 0.6673306947742298,
634
+ "eval_prec_anger": 0.5800498753117207,
635
+ "eval_prec_disgust": 0.534965034965035,
636
+ "eval_prec_fear": 0.8117359413202934,
637
+ "eval_prec_joy": 0.7029492892000849,
638
+ "eval_prec_neutral": 0.8421692379616643,
639
+ "eval_prec_sadness": 0.6650943396226415,
640
+ "eval_prec_surprise": 0.5343511450381679,
641
+ "eval_recall": 0.5864396115457234,
642
+ "eval_recall_anger": 0.6432522123893806,
643
+ "eval_recall_disgust": 0.3200836820083682,
644
+ "eval_recall_fear": 0.486090775988287,
645
+ "eval_recall_joy": 0.7795294117647059,
646
+ "eval_recall_neutral": 0.8455689072474653,
647
+ "eval_recall_sadness": 0.6724960254372019,
648
+ "eval_recall_surprise": 0.35805626598465473,
649
+ "eval_runtime": 52.4759,
650
+ "eval_samples_per_second": 391.418,
651
+ "eval_steps_per_second": 24.468,
652
+ "step": 10990
653
+ },
654
+ {
655
+ "epoch": 7.51,
656
+ "learning_rate": 0.0005261544357156543,
657
+ "loss": 0.6297,
658
+ "step": 11000
659
+ },
660
+ {
661
+ "epoch": 7.66,
662
+ "learning_rate": 0.0005156160183943285,
663
+ "loss": 0.6373,
664
+ "step": 11220
665
+ },
666
+ {
667
+ "epoch": 7.81,
668
+ "learning_rate": 0.0005050776010730025,
669
+ "loss": 0.6278,
670
+ "step": 11440
671
+ },
672
+ {
673
+ "epoch": 7.96,
674
+ "learning_rate": 0.0004945391837516765,
675
+ "loss": 0.6321,
676
+ "step": 11660
677
+ },
678
+ {
679
+ "epoch": 8.11,
680
+ "learning_rate": 0.0004840007664303506,
681
+ "loss": 0.6045,
682
+ "step": 11880
683
+ },
684
+ {
685
+ "epoch": 8.25,
686
+ "eval_accuracy": 0.7577896786757546,
687
+ "eval_b_acc": 0.6005624120936303,
688
+ "eval_f1": 0.6238197827942396,
689
+ "eval_f1_anger": 0.6038186157517901,
690
+ "eval_f1_disgust": 0.4337078651685393,
691
+ "eval_f1_fear": 0.6333907056798622,
692
+ "eval_f1_joy": 0.7377106333527018,
693
+ "eval_f1_neutral": 0.8465511724642318,
694
+ "eval_f1_sadness": 0.6661166116611661,
695
+ "eval_f1_surprise": 0.4454428754813864,
696
+ "eval_loss": 0.6667613387107849,
697
+ "eval_micro_f1": 0.7577896786757546,
698
+ "eval_prec": 0.6550680878375978,
699
+ "eval_prec_anger": 0.655440414507772,
700
+ "eval_prec_disgust": 0.4684466019417476,
701
+ "eval_prec_fear": 0.7682672233820459,
702
+ "eval_prec_joy": 0.7288174512055109,
703
+ "eval_prec_neutral": 0.8249443207126949,
704
+ "eval_prec_sadness": 0.6923956546598056,
705
+ "eval_prec_surprise": 0.44716494845360827,
706
+ "eval_recall": 0.6005624120936303,
707
+ "eval_recall_anger": 0.5597345132743363,
708
+ "eval_recall_disgust": 0.40376569037656906,
709
+ "eval_recall_fear": 0.5387994143484627,
710
+ "eval_recall_joy": 0.7468235294117647,
711
+ "eval_recall_neutral": 0.8693203154337213,
712
+ "eval_recall_sadness": 0.6417594064652888,
713
+ "eval_recall_surprise": 0.4437340153452685,
714
+ "eval_runtime": 54.5559,
715
+ "eval_samples_per_second": 376.494,
716
+ "eval_steps_per_second": 23.535,
717
+ "step": 12089
718
+ },
719
+ {
720
+ "epoch": 8.26,
721
+ "learning_rate": 0.00047346234910902474,
722
+ "loss": 0.6078,
723
+ "step": 12100
724
+ },
725
+ {
726
+ "epoch": 8.41,
727
+ "learning_rate": 0.0004629239317876988,
728
+ "loss": 0.6091,
729
+ "step": 12320
730
+ },
731
+ {
732
+ "epoch": 8.56,
733
+ "learning_rate": 0.0004523855144663729,
734
+ "loss": 0.6127,
735
+ "step": 12540
736
+ },
737
+ {
738
+ "epoch": 8.71,
739
+ "learning_rate": 0.00044184709714504693,
740
+ "loss": 0.6243,
741
+ "step": 12760
742
+ },
743
+ {
744
+ "epoch": 8.86,
745
+ "learning_rate": 0.000431308679823721,
746
+ "loss": 0.6182,
747
+ "step": 12980
748
+ },
749
+ {
750
+ "epoch": 9.0,
751
+ "eval_accuracy": 0.7570593962999026,
752
+ "eval_b_acc": 0.6044499151869599,
753
+ "eval_f1": 0.6204901474344295,
754
+ "eval_f1_anger": 0.6087460179554011,
755
+ "eval_f1_disgust": 0.44725738396624476,
756
+ "eval_f1_fear": 0.6212361331220285,
757
+ "eval_f1_joy": 0.7376712328767122,
758
+ "eval_f1_neutral": 0.8463038632986627,
759
+ "eval_f1_sadness": 0.6678737713398861,
760
+ "eval_f1_surprise": 0.41434262948207173,
761
+ "eval_loss": 0.6659196615219116,
762
+ "eval_micro_f1": 0.7570593962999026,
763
+ "eval_prec": 0.6461033688057751,
764
+ "eval_prec_anger": 0.6389057750759879,
765
+ "eval_prec_disgust": 0.451063829787234,
766
+ "eval_prec_fear": 0.6770293609671848,
767
+ "eval_prec_joy": 0.7164079822616408,
768
+ "eval_prec_neutral": 0.8372840867328188,
769
+ "eval_prec_sadness": 0.6523496715512885,
770
+ "eval_prec_surprise": 0.5496828752642706,
771
+ "eval_recall": 0.6044499151869599,
772
+ "eval_recall_anger": 0.5813053097345132,
773
+ "eval_recall_disgust": 0.4435146443514644,
774
+ "eval_recall_fear": 0.5739385065885798,
775
+ "eval_recall_joy": 0.760235294117647,
776
+ "eval_recall_neutral": 0.8555200901239204,
777
+ "eval_recall_sadness": 0.6841547429782724,
778
+ "eval_recall_surprise": 0.33248081841432225,
779
+ "eval_runtime": 53.1364,
780
+ "eval_samples_per_second": 386.552,
781
+ "eval_steps_per_second": 24.164,
782
+ "step": 13188
783
+ },
784
+ {
785
+ "epoch": 9.01,
786
+ "learning_rate": 0.0004207702625023951,
787
+ "loss": 0.6299,
788
+ "step": 13200
789
+ },
790
+ {
791
+ "epoch": 9.16,
792
+ "learning_rate": 0.00041023184518106917,
793
+ "loss": 0.5991,
794
+ "step": 13420
795
+ },
796
+ {
797
+ "epoch": 9.31,
798
+ "learning_rate": 0.00039969342785974325,
799
+ "loss": 0.5962,
800
+ "step": 13640
801
+ },
802
+ {
803
+ "epoch": 9.46,
804
+ "learning_rate": 0.00038915501053841733,
805
+ "loss": 0.6014,
806
+ "step": 13860
807
+ },
808
+ {
809
+ "epoch": 9.61,
810
+ "learning_rate": 0.0003786165932170914,
811
+ "loss": 0.5927,
812
+ "step": 14080
813
+ },
814
+ {
815
+ "epoch": 9.75,
816
+ "eval_accuracy": 0.7466407010710808,
817
+ "eval_b_acc": 0.5639997332284856,
818
+ "eval_f1": 0.595181302839129,
819
+ "eval_f1_anger": 0.5956719817767653,
820
+ "eval_f1_disgust": 0.3489736070381232,
821
+ "eval_f1_fear": 0.6333059885151764,
822
+ "eval_f1_joy": 0.7182098034572578,
823
+ "eval_f1_neutral": 0.8372471833853672,
824
+ "eval_f1_sadness": 0.6523649521840268,
825
+ "eval_f1_surprise": 0.38049560351718625,
826
+ "eval_loss": 0.7097288966178894,
827
+ "eval_micro_f1": 0.7466407010710808,
828
+ "eval_prec": 0.6560660561913124,
829
+ "eval_prec_anger": 0.613849765258216,
830
+ "eval_prec_disgust": 0.5833333333333334,
831
+ "eval_prec_fear": 0.7201492537313433,
832
+ "eval_prec_joy": 0.7228312678741659,
833
+ "eval_prec_neutral": 0.8081055113983754,
834
+ "eval_prec_sadness": 0.6367305751765893,
835
+ "eval_prec_surprise": 0.5074626865671642,
836
+ "eval_recall": 0.5639997332284856,
837
+ "eval_recall_anger": 0.5785398230088495,
838
+ "eval_recall_disgust": 0.2489539748953975,
839
+ "eval_recall_fear": 0.5651537335285505,
840
+ "eval_recall_joy": 0.7136470588235294,
841
+ "eval_recall_neutral": 0.8685692827638002,
842
+ "eval_recall_sadness": 0.6687864334923158,
843
+ "eval_recall_surprise": 0.30434782608695654,
844
+ "eval_runtime": 53.7235,
845
+ "eval_samples_per_second": 382.328,
846
+ "eval_steps_per_second": 23.9,
847
+ "step": 14287
848
+ },
849
+ {
850
+ "epoch": 9.76,
851
+ "learning_rate": 0.0003680781758957655,
852
+ "loss": 0.5977,
853
+ "step": 14300
854
+ },
855
+ {
856
+ "epoch": 9.91,
857
+ "learning_rate": 0.00035753975857443957,
858
+ "loss": 0.6181,
859
+ "step": 14520
860
+ },
861
+ {
862
+ "epoch": 10.06,
863
+ "learning_rate": 0.00034704924315002875,
864
+ "loss": 0.595,
865
+ "step": 14740
866
+ },
867
+ {
868
+ "epoch": 10.21,
869
+ "learning_rate": 0.00033651082582870283,
870
+ "loss": 0.5668,
871
+ "step": 14960
872
+ },
873
+ {
874
+ "epoch": 10.36,
875
+ "learning_rate": 0.0003259724085073769,
876
+ "loss": 0.5736,
877
+ "step": 15180
878
+ },
879
+ {
880
+ "epoch": 10.5,
881
+ "eval_accuracy": 0.758666017526777,
882
+ "eval_b_acc": 0.6092103490403898,
883
+ "eval_f1": 0.6224896550246998,
884
+ "eval_f1_anger": 0.6192840344917692,
885
+ "eval_f1_disgust": 0.42822966507177035,
886
+ "eval_f1_fear": 0.6338028169014085,
887
+ "eval_f1_joy": 0.742619926199262,
888
+ "eval_f1_neutral": 0.8472516603080401,
889
+ "eval_f1_sadness": 0.672,
890
+ "eval_f1_surprise": 0.4142394822006473,
891
+ "eval_loss": 0.6662837862968445,
892
+ "eval_micro_f1": 0.758666017526777,
893
+ "eval_prec": 0.6494125401879046,
894
+ "eval_prec_anger": 0.586924219910847,
895
+ "eval_prec_disgust": 0.5,
896
+ "eval_prec_fear": 0.680672268907563,
897
+ "eval_prec_joy": 0.7281772953414745,
898
+ "eval_prec_neutral": 0.8501748747518669,
899
+ "eval_prec_sadness": 0.6360624704212021,
900
+ "eval_prec_surprise": 0.5638766519823789,
901
+ "eval_recall": 0.6092103490403898,
902
+ "eval_recall_anger": 0.6554203539823009,
903
+ "eval_recall_disgust": 0.37447698744769875,
904
+ "eval_recall_fear": 0.5929721815519766,
905
+ "eval_recall_joy": 0.7576470588235295,
906
+ "eval_recall_neutral": 0.8443484791588434,
907
+ "eval_recall_sadness": 0.712241653418124,
908
+ "eval_recall_surprise": 0.3273657289002558,
909
+ "eval_runtime": 52.4006,
910
+ "eval_samples_per_second": 391.98,
911
+ "eval_steps_per_second": 24.504,
912
+ "step": 15386
913
+ },
914
+ {
915
+ "epoch": 10.51,
916
+ "learning_rate": 0.000315433991186051,
917
+ "loss": 0.5779,
918
+ "step": 15400
919
+ },
920
+ {
921
+ "epoch": 10.66,
922
+ "learning_rate": 0.00030489557386472507,
923
+ "loss": 0.5816,
924
+ "step": 15620
925
+ },
926
+ {
927
+ "epoch": 10.81,
928
+ "learning_rate": 0.0002943571565433991,
929
+ "loss": 0.5866,
930
+ "step": 15840
931
+ },
932
+ {
933
+ "epoch": 10.96,
934
+ "learning_rate": 0.0002838187392220732,
935
+ "loss": 0.5797,
936
+ "step": 16060
937
+ },
938
+ {
939
+ "epoch": 11.11,
940
+ "learning_rate": 0.00027328032190074725,
941
+ "loss": 0.5687,
942
+ "step": 16280
943
+ },
944
+ {
945
+ "epoch": 11.25,
946
+ "eval_accuracy": 0.7633398247322298,
947
+ "eval_b_acc": 0.6147514191038456,
948
+ "eval_f1": 0.6337188907871468,
949
+ "eval_f1_anger": 0.6268229911352589,
950
+ "eval_f1_disgust": 0.470076169749728,
951
+ "eval_f1_fear": 0.6422018348623854,
952
+ "eval_f1_joy": 0.7406107406107406,
953
+ "eval_f1_neutral": 0.8523923886938851,
954
+ "eval_f1_sadness": 0.6596455175956846,
955
+ "eval_f1_surprise": 0.4442825928623452,
956
+ "eval_loss": 0.6598661541938782,
957
+ "eval_micro_f1": 0.7633398247322298,
958
+ "eval_prec": 0.6594926170544204,
959
+ "eval_prec_anger": 0.6489046773238603,
960
+ "eval_prec_disgust": 0.4897959183673469,
961
+ "eval_prec_fear": 0.7461240310077519,
962
+ "eval_prec_joy": 0.7365603909704445,
963
+ "eval_prec_neutral": 0.8389090909090909,
964
+ "eval_prec_sadness": 0.6400797607178464,
965
+ "eval_prec_surprise": 0.5160744500846024,
966
+ "eval_recall": 0.6147514191038456,
967
+ "eval_recall_anger": 0.6061946902654868,
968
+ "eval_recall_disgust": 0.45188284518828453,
969
+ "eval_recall_fear": 0.5636896046852123,
970
+ "eval_recall_joy": 0.7447058823529412,
971
+ "eval_recall_neutral": 0.8663161847540368,
972
+ "eval_recall_sadness": 0.6804451510333863,
973
+ "eval_recall_surprise": 0.3900255754475703,
974
+ "eval_runtime": 54.1532,
975
+ "eval_samples_per_second": 379.294,
976
+ "eval_steps_per_second": 23.711,
977
+ "step": 16485
978
+ },
979
+ {
980
+ "epoch": 11.26,
981
+ "learning_rate": 0.0002627419045794214,
982
+ "loss": 0.5575,
983
+ "step": 16500
984
+ },
985
+ {
986
+ "epoch": 11.41,
987
+ "learning_rate": 0.00025220348725809547,
988
+ "loss": 0.5672,
989
+ "step": 16720
990
+ },
991
+ {
992
+ "epoch": 11.56,
993
+ "learning_rate": 0.00024166506993676952,
994
+ "loss": 0.5582,
995
+ "step": 16940
996
+ },
997
+ {
998
+ "epoch": 11.71,
999
+ "learning_rate": 0.00023112665261544357,
1000
+ "loss": 0.5607,
1001
+ "step": 17160
1002
+ },
1003
+ {
1004
+ "epoch": 11.86,
1005
+ "learning_rate": 0.00022058823529411765,
1006
+ "loss": 0.5652,
1007
+ "step": 17380
1008
+ },
1009
+ {
1010
+ "epoch": 12.0,
1011
+ "eval_accuracy": 0.7630963972736124,
1012
+ "eval_b_acc": 0.6053830892588602,
1013
+ "eval_f1": 0.6276991641576467,
1014
+ "eval_f1_anger": 0.6168702073274639,
1015
+ "eval_f1_disgust": 0.43303571428571425,
1016
+ "eval_f1_fear": 0.638801261829653,
1017
+ "eval_f1_joy": 0.7379285799027169,
1018
+ "eval_f1_neutral": 0.8519039622384605,
1019
+ "eval_f1_sadness": 0.6683630195080577,
1020
+ "eval_f1_surprise": 0.44699140401146126,
1021
+ "eval_loss": 0.6577332019805908,
1022
+ "eval_micro_f1": 0.7630963972736124,
1023
+ "eval_prec": 0.6548174460459298,
1024
+ "eval_prec_anger": 0.6339754816112084,
1025
+ "eval_prec_disgust": 0.46411483253588515,
1026
+ "eval_prec_fear": 0.6923076923076923,
1027
+ "eval_prec_joy": 0.7441971763579803,
1028
+ "eval_prec_neutral": 0.8246199806695369,
1029
+ "eval_prec_sadness": 0.7163636363636363,
1030
+ "eval_prec_surprise": 0.50814332247557,
1031
+ "eval_recall": 0.6053830892588602,
1032
+ "eval_recall_anger": 0.6006637168141593,
1033
+ "eval_recall_disgust": 0.40585774058577406,
1034
+ "eval_recall_fear": 0.5929721815519766,
1035
+ "eval_recall_joy": 0.731764705882353,
1036
+ "eval_recall_neutral": 0.8810552009012392,
1037
+ "eval_recall_sadness": 0.6263910969793323,
1038
+ "eval_recall_surprise": 0.3989769820971867,
1039
+ "eval_runtime": 53.0543,
1040
+ "eval_samples_per_second": 387.151,
1041
+ "eval_steps_per_second": 24.202,
1042
+ "step": 17584
1043
+ },
1044
+ {
1045
+ "epoch": 12.01,
1046
+ "learning_rate": 0.00021004981797279173,
1047
+ "loss": 0.5559,
1048
+ "step": 17600
1049
+ },
1050
+ {
1051
+ "epoch": 12.16,
1052
+ "learning_rate": 0.00019951140065146582,
1053
+ "loss": 0.5439,
1054
+ "step": 17820
1055
+ },
1056
+ {
1057
+ "epoch": 12.31,
1058
+ "learning_rate": 0.00018897298333013987,
1059
+ "loss": 0.5438,
1060
+ "step": 18040
1061
+ },
1062
+ {
1063
+ "epoch": 12.46,
1064
+ "learning_rate": 0.00017843456600881395,
1065
+ "loss": 0.543,
1066
+ "step": 18260
1067
+ },
1068
+ {
1069
+ "epoch": 12.61,
1070
+ "learning_rate": 0.00016789614868748803,
1071
+ "loss": 0.5377,
1072
+ "step": 18480
1073
+ },
1074
+ {
1075
+ "epoch": 12.75,
1076
+ "eval_accuracy": 0.7619766309639727,
1077
+ "eval_b_acc": 0.6124179118880813,
1078
+ "eval_f1": 0.6250179854378021,
1079
+ "eval_f1_anger": 0.6205983584855705,
1080
+ "eval_f1_disgust": 0.41743119266055045,
1081
+ "eval_f1_fear": 0.6180981595092024,
1082
+ "eval_f1_joy": 0.7463065558633425,
1083
+ "eval_f1_neutral": 0.8512547315295107,
1084
+ "eval_f1_sadness": 0.6756976429151992,
1085
+ "eval_f1_surprise": 0.44573925710123824,
1086
+ "eval_loss": 0.6680665612220764,
1087
+ "eval_micro_f1": 0.7619766309639727,
1088
+ "eval_prec": 0.6421501390714648,
1089
+ "eval_prec_anger": 0.595226003047232,
1090
+ "eval_prec_disgust": 0.4619289340101523,
1091
+ "eval_prec_fear": 0.6489533011272142,
1092
+ "eval_prec_joy": 0.732442229270503,
1093
+ "eval_prec_neutral": 0.8474923234390993,
1094
+ "eval_prec_sadness": 0.6912416851441242,
1095
+ "eval_prec_surprise": 0.5177664974619289,
1096
+ "eval_recall": 0.6124179118880813,
1097
+ "eval_recall_anger": 0.6482300884955752,
1098
+ "eval_recall_disgust": 0.3807531380753138,
1099
+ "eval_recall_fear": 0.5900439238653001,
1100
+ "eval_recall_joy": 0.7607058823529412,
1101
+ "eval_recall_neutral": 0.8550506947052197,
1102
+ "eval_recall_sadness": 0.6608373078961314,
1103
+ "eval_recall_surprise": 0.391304347826087,
1104
+ "eval_runtime": 53.2844,
1105
+ "eval_samples_per_second": 385.479,
1106
+ "eval_steps_per_second": 24.097,
1107
+ "step": 18683
1108
+ },
1109
+ {
1110
+ "epoch": 12.76,
1111
+ "learning_rate": 0.0001573577313661621,
1112
+ "loss": 0.5457,
1113
+ "step": 18700
1114
+ },
1115
+ {
1116
+ "epoch": 12.91,
1117
+ "learning_rate": 0.00014681931404483616,
1118
+ "loss": 0.5445,
1119
+ "step": 18920
1120
+ },
1121
+ {
1122
+ "epoch": 13.06,
1123
+ "learning_rate": 0.0001363287986204254,
1124
+ "loss": 0.5323,
1125
+ "step": 19140
1126
+ },
1127
+ {
1128
+ "epoch": 13.21,
1129
+ "learning_rate": 0.00012579038129909945,
1130
+ "loss": 0.5214,
1131
+ "step": 19360
1132
+ },
1133
+ {
1134
+ "epoch": 13.36,
1135
+ "learning_rate": 0.00011525196397777351,
1136
+ "loss": 0.5312,
1137
+ "step": 19580
1138
+ },
1139
+ {
1140
+ "epoch": 13.5,
1141
+ "eval_accuracy": 0.7594449853943525,
1142
+ "eval_b_acc": 0.6161690104230055,
1143
+ "eval_f1": 0.62474808335526,
1144
+ "eval_f1_anger": 0.6223776223776223,
1145
+ "eval_f1_disgust": 0.4353448275862069,
1146
+ "eval_f1_fear": 0.6165413533834586,
1147
+ "eval_f1_joy": 0.742164744261913,
1148
+ "eval_f1_neutral": 0.8496567185091775,
1149
+ "eval_f1_sadness": 0.6675588865096359,
1150
+ "eval_f1_surprise": 0.4395924308588064,
1151
+ "eval_loss": 0.6776713132858276,
1152
+ "eval_micro_f1": 0.7594449853943525,
1153
+ "eval_prec": 0.636197719648956,
1154
+ "eval_prec_anger": 0.6057591623036649,
1155
+ "eval_prec_disgust": 0.4488888888888889,
1156
+ "eval_prec_fear": 0.633693972179289,
1157
+ "eval_prec_joy": 0.7350565428109854,
1158
+ "eval_prec_neutral": 0.8454317315735663,
1159
+ "eval_prec_sadness": 0.6744186046511628,
1160
+ "eval_prec_surprise": 0.5101351351351351,
1161
+ "eval_recall": 0.6161690104230055,
1162
+ "eval_recall_anger": 0.639933628318584,
1163
+ "eval_recall_disgust": 0.4225941422594142,
1164
+ "eval_recall_fear": 0.6002928257686676,
1165
+ "eval_recall_joy": 0.7494117647058823,
1166
+ "eval_recall_neutral": 0.8539241457003379,
1167
+ "eval_recall_sadness": 0.6608373078961314,
1168
+ "eval_recall_surprise": 0.38618925831202044,
1169
+ "eval_runtime": 52.4495,
1170
+ "eval_samples_per_second": 391.615,
1171
+ "eval_steps_per_second": 24.481,
1172
+ "step": 19782
1173
+ },
1174
+ {
1175
+ "epoch": 13.51,
1176
+ "learning_rate": 0.00010471354665644759,
1177
+ "loss": 0.5261,
1178
+ "step": 19800
1179
+ },
1180
+ {
1181
+ "epoch": 13.66,
1182
+ "learning_rate": 9.417512933512167e-05,
1183
+ "loss": 0.5282,
1184
+ "step": 20020
1185
+ },
1186
+ {
1187
+ "epoch": 13.81,
1188
+ "learning_rate": 8.363671201379575e-05,
1189
+ "loss": 0.5201,
1190
+ "step": 20240
1191
+ },
1192
+ {
1193
+ "epoch": 13.96,
1194
+ "learning_rate": 7.309829469246983e-05,
1195
+ "loss": 0.5292,
1196
+ "step": 20460
1197
+ },
1198
+ {
1199
+ "epoch": 14.11,
1200
+ "learning_rate": 6.25598773711439e-05,
1201
+ "loss": 0.512,
1202
+ "step": 20680
1203
+ },
1204
+ {
1205
+ "epoch": 14.25,
1206
+ "eval_accuracy": 0.7568646543330088,
1207
+ "eval_b_acc": 0.6172231293216093,
1208
+ "eval_f1": 0.6274045304621182,
1209
+ "eval_f1_anger": 0.6168593177332957,
1210
+ "eval_f1_disgust": 0.44719101123595506,
1211
+ "eval_f1_fear": 0.621580547112462,
1212
+ "eval_f1_joy": 0.7408979227161047,
1213
+ "eval_f1_neutral": 0.8446776328228398,
1214
+ "eval_f1_sadness": 0.6684141546526867,
1215
+ "eval_f1_surprise": 0.4522111269614835,
1216
+ "eval_loss": 0.6823310852050781,
1217
+ "eval_micro_f1": 0.7568646543330088,
1218
+ "eval_prec": 0.6409438141857619,
1219
+ "eval_prec_anger": 0.6290971822886716,
1220
+ "eval_prec_disgust": 0.4830097087378641,
1221
+ "eval_prec_fear": 0.6461295418641391,
1222
+ "eval_prec_joy": 0.7051445578231292,
1223
+ "eval_prec_neutral": 0.8506283320639756,
1224
+ "eval_prec_sadness": 0.6613070539419087,
1225
+ "eval_prec_surprise": 0.5112903225806451,
1226
+ "eval_recall": 0.6172231293216093,
1227
+ "eval_recall_anger": 0.6050884955752213,
1228
+ "eval_recall_disgust": 0.41631799163179917,
1229
+ "eval_recall_fear": 0.5988286969253295,
1230
+ "eval_recall_joy": 0.7804705882352941,
1231
+ "eval_recall_neutral": 0.838809613218175,
1232
+ "eval_recall_sadness": 0.6756756756756757,
1233
+ "eval_recall_surprise": 0.4053708439897698,
1234
+ "eval_runtime": 53.2289,
1235
+ "eval_samples_per_second": 385.881,
1236
+ "eval_steps_per_second": 24.122,
1237
+ "step": 20881
1238
+ },
1239
+ {
1240
+ "epoch": 14.26,
1241
+ "learning_rate": 5.202146004981798e-05,
1242
+ "loss": 0.5179,
1243
+ "step": 20900
1244
+ },
1245
+ {
1246
+ "epoch": 14.41,
1247
+ "learning_rate": 4.148304272849205e-05,
1248
+ "loss": 0.5085,
1249
+ "step": 21120
1250
+ },
1251
+ {
1252
+ "epoch": 14.56,
1253
+ "learning_rate": 3.099252730408124e-05,
1254
+ "loss": 0.5083,
1255
+ "step": 21340
1256
+ },
1257
+ {
1258
+ "epoch": 14.71,
1259
+ "learning_rate": 2.0454109982755316e-05,
1260
+ "loss": 0.5121,
1261
+ "step": 21560
1262
+ },
1263
+ {
1264
+ "epoch": 14.86,
1265
+ "learning_rate": 9.915692661429392e-06,
1266
+ "loss": 0.5026,
1267
+ "step": 21780
1268
+ },
1269
+ {
1270
+ "epoch": 15.0,
1271
+ "step": 21975,
1272
+ "total_flos": 6.592350719428977e+17,
1273
+ "train_loss": 0.6400373776102771,
1274
+ "train_runtime": 15988.8097,
1275
+ "train_samples_per_second": 175.927,
1276
+ "train_steps_per_second": 1.374
1277
+ }
1278
+ ],
1279
+ "max_steps": 21975,
1280
+ "num_train_epochs": 15,
1281
+ "total_flos": 6.592350719428977e+17,
1282
+ "trial_name": null,
1283
+ "trial_params": null
1284
+ }