Fitsum Gaim commited on
Commit
68db11e
1 Parent(s): 56201f9
all_results.json DELETED
@@ -1,185 +0,0 @@
1
- {
2
- "epoch": 10.0,
3
- "eval_ADJ_f1": 0.9277000892591492,
4
- "eval_ADJ_number": 1670,
5
- "eval_ADJ_precision": 0.92193968066233,
6
- "eval_ADJ_recall": 0.9335329341317365,
7
- "eval_ADV_f1": 0.8423194303153613,
8
- "eval_ADV_number": 484,
9
- "eval_ADV_precision": 0.8296593186372746,
10
- "eval_ADV_recall": 0.8553719008264463,
11
- "eval_CON_f1": 0.9803719008264462,
12
- "eval_CON_number": 972,
13
- "eval_CON_precision": 0.9844398340248963,
14
- "eval_CON_recall": 0.9763374485596708,
15
- "eval_FW_f1": 0.6382978723404255,
16
- "eval_FW_number": 28,
17
- "eval_FW_precision": 0.7894736842105263,
18
- "eval_FW_recall": 0.5357142857142857,
19
- "eval_INT_f1": 0.6909090909090909,
20
- "eval_INT_number": 26,
21
- "eval_INT_precision": 0.6551724137931034,
22
- "eval_INT_recall": 0.7307692307692307,
23
- "eval_NUM_f1": 0.9705882352941178,
24
- "eval_NUM_number": 239,
25
- "eval_NUM_precision": 0.9746835443037974,
26
- "eval_NUM_recall": 0.9665271966527197,
27
- "eval_N_PRP_f1": 0.9376979936642028,
28
- "eval_N_PRP_number": 470,
29
- "eval_N_PRP_precision": 0.9308176100628931,
30
- "eval_N_PRP_recall": 0.9446808510638298,
31
- "eval_N_V_f1": 0.9794437726723096,
32
- "eval_N_V_number": 416,
33
- "eval_N_V_precision": 0.9854014598540146,
34
- "eval_N_V_recall": 0.9735576923076923,
35
- "eval_N_f1": 0.965577669295281,
36
- "eval_N_number": 3992,
37
- "eval_N_precision": 0.9649737302977233,
38
- "eval_N_recall": 0.966182364729459,
39
- "eval_PRE_f1": 0.9673130193905818,
40
- "eval_PRE_number": 907,
41
- "eval_PRE_precision": 0.9721603563474388,
42
- "eval_PRE_recall": 0.9625137816979051,
43
- "eval_PRO_f1": 0.9340909090909091,
44
- "eval_PRO_number": 445,
45
- "eval_PRO_precision": 0.9448275862068966,
46
- "eval_PRO_recall": 0.9235955056179775,
47
- "eval_PUN_f1": 0.9996887643946467,
48
- "eval_PUN_number": 1607,
49
- "eval_PUN_precision": 1.0,
50
- "eval_PUN_recall": 0.9993777224642191,
51
- "eval_UNC_f1": 0.9333333333333333,
52
- "eval_UNC_number": 16,
53
- "eval_UNC_precision": 1.0,
54
- "eval_UNC_recall": 0.875,
55
- "eval_V_AUX_f1": 0.9780469341408025,
56
- "eval_V_AUX_number": 654,
57
- "eval_V_AUX_precision": 0.9685157421289355,
58
- "eval_V_AUX_recall": 0.9877675840978594,
59
- "eval_V_GER_f1": 0.9478764478764479,
60
- "eval_V_GER_number": 513,
61
- "eval_V_GER_precision": 0.9388145315487572,
62
- "eval_V_GER_recall": 0.9571150097465887,
63
- "eval_V_IMF_f1": 0.9564738292011019,
64
- "eval_V_IMF_number": 914,
65
- "eval_V_IMF_precision": 0.9633740288568258,
66
- "eval_V_IMF_recall": 0.949671772428884,
67
- "eval_V_IMV_f1": 0.796875,
68
- "eval_V_IMV_number": 70,
69
- "eval_V_IMV_precision": 0.8793103448275862,
70
- "eval_V_IMV_recall": 0.7285714285714285,
71
- "eval_V_PRF_f1": 0.902027027027027,
72
- "eval_V_PRF_number": 294,
73
- "eval_V_PRF_precision": 0.8959731543624161,
74
- "eval_V_PRF_recall": 0.9081632653061225,
75
- "eval_V_REL_f1": 0.9607451763140386,
76
- "eval_V_REL_number": 757,
77
- "eval_V_REL_precision": 0.967828418230563,
78
- "eval_V_REL_recall": 0.9537648612945839,
79
- "eval_V_f1": 0.9,
80
- "eval_V_number": 78,
81
- "eval_V_precision": 0.8780487804878049,
82
- "eval_V_recall": 0.9230769230769231,
83
- "eval_loss": 0.3193676769733429,
84
- "eval_overall_accuracy": 0.9561572292468389,
85
- "eval_overall_f1": 0.9561572292468388,
86
- "eval_overall_precision": 0.9561572292468389,
87
- "eval_overall_recall": 0.9561572292468389,
88
- "eval_runtime": 14.3338,
89
- "eval_samples": 929,
90
- "eval_samples_per_second": 64.812,
91
- "eval_steps_per_second": 2.093,
92
- "predict_ADJ_f1": 0.9277000892591492,
93
- "predict_ADJ_number": 1670,
94
- "predict_ADJ_precision": 0.92193968066233,
95
- "predict_ADJ_recall": 0.9335329341317365,
96
- "predict_ADV_f1": 0.8423194303153613,
97
- "predict_ADV_number": 484,
98
- "predict_ADV_precision": 0.8296593186372746,
99
- "predict_ADV_recall": 0.8553719008264463,
100
- "predict_CON_f1": 0.9803719008264462,
101
- "predict_CON_number": 972,
102
- "predict_CON_precision": 0.9844398340248963,
103
- "predict_CON_recall": 0.9763374485596708,
104
- "predict_FW_f1": 0.6382978723404255,
105
- "predict_FW_number": 28,
106
- "predict_FW_precision": 0.7894736842105263,
107
- "predict_FW_recall": 0.5357142857142857,
108
- "predict_INT_f1": 0.6909090909090909,
109
- "predict_INT_number": 26,
110
- "predict_INT_precision": 0.6551724137931034,
111
- "predict_INT_recall": 0.7307692307692307,
112
- "predict_NUM_f1": 0.9705882352941178,
113
- "predict_NUM_number": 239,
114
- "predict_NUM_precision": 0.9746835443037974,
115
- "predict_NUM_recall": 0.9665271966527197,
116
- "predict_N_PRP_f1": 0.9376979936642028,
117
- "predict_N_PRP_number": 470,
118
- "predict_N_PRP_precision": 0.9308176100628931,
119
- "predict_N_PRP_recall": 0.9446808510638298,
120
- "predict_N_V_f1": 0.9794437726723096,
121
- "predict_N_V_number": 416,
122
- "predict_N_V_precision": 0.9854014598540146,
123
- "predict_N_V_recall": 0.9735576923076923,
124
- "predict_N_f1": 0.965577669295281,
125
- "predict_N_number": 3992,
126
- "predict_N_precision": 0.9649737302977233,
127
- "predict_N_recall": 0.966182364729459,
128
- "predict_PRE_f1": 0.9673130193905818,
129
- "predict_PRE_number": 907,
130
- "predict_PRE_precision": 0.9721603563474388,
131
- "predict_PRE_recall": 0.9625137816979051,
132
- "predict_PRO_f1": 0.9340909090909091,
133
- "predict_PRO_number": 445,
134
- "predict_PRO_precision": 0.9448275862068966,
135
- "predict_PRO_recall": 0.9235955056179775,
136
- "predict_PUN_f1": 0.9996887643946467,
137
- "predict_PUN_number": 1607,
138
- "predict_PUN_precision": 1.0,
139
- "predict_PUN_recall": 0.9993777224642191,
140
- "predict_UNC_f1": 0.9333333333333333,
141
- "predict_UNC_number": 16,
142
- "predict_UNC_precision": 1.0,
143
- "predict_UNC_recall": 0.875,
144
- "predict_V_AUX_f1": 0.9780469341408025,
145
- "predict_V_AUX_number": 654,
146
- "predict_V_AUX_precision": 0.9685157421289355,
147
- "predict_V_AUX_recall": 0.9877675840978594,
148
- "predict_V_GER_f1": 0.9478764478764479,
149
- "predict_V_GER_number": 513,
150
- "predict_V_GER_precision": 0.9388145315487572,
151
- "predict_V_GER_recall": 0.9571150097465887,
152
- "predict_V_IMF_f1": 0.9564738292011019,
153
- "predict_V_IMF_number": 914,
154
- "predict_V_IMF_precision": 0.9633740288568258,
155
- "predict_V_IMF_recall": 0.949671772428884,
156
- "predict_V_IMV_f1": 0.796875,
157
- "predict_V_IMV_number": 70,
158
- "predict_V_IMV_precision": 0.8793103448275862,
159
- "predict_V_IMV_recall": 0.7285714285714285,
160
- "predict_V_PRF_f1": 0.902027027027027,
161
- "predict_V_PRF_number": 294,
162
- "predict_V_PRF_precision": 0.8959731543624161,
163
- "predict_V_PRF_recall": 0.9081632653061225,
164
- "predict_V_REL_f1": 0.9607451763140386,
165
- "predict_V_REL_number": 757,
166
- "predict_V_REL_precision": 0.967828418230563,
167
- "predict_V_REL_recall": 0.9537648612945839,
168
- "predict_V_f1": 0.9,
169
- "predict_V_number": 78,
170
- "predict_V_precision": 0.8780487804878049,
171
- "predict_V_recall": 0.9230769230769231,
172
- "predict_loss": 0.3193676769733429,
173
- "predict_overall_accuracy": 0.9561572292468389,
174
- "predict_overall_f1": 0.9561572292468388,
175
- "predict_overall_precision": 0.9561572292468389,
176
- "predict_overall_recall": 0.9561572292468389,
177
- "predict_runtime": 14.2811,
178
- "predict_samples_per_second": 65.051,
179
- "predict_steps_per_second": 2.101,
180
- "train_loss": 0.07197833191200252,
181
- "train_runtime": 2030.3618,
182
- "train_samples": 3691,
183
- "train_samples_per_second": 18.179,
184
- "train_steps_per_second": 2.275
185
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
eval_results.json DELETED
@@ -1,92 +0,0 @@
1
- {
2
- "epoch": 10.0,
3
- "eval_ADJ_f1": 0.9277000892591492,
4
- "eval_ADJ_number": 1670,
5
- "eval_ADJ_precision": 0.92193968066233,
6
- "eval_ADJ_recall": 0.9335329341317365,
7
- "eval_ADV_f1": 0.8423194303153613,
8
- "eval_ADV_number": 484,
9
- "eval_ADV_precision": 0.8296593186372746,
10
- "eval_ADV_recall": 0.8553719008264463,
11
- "eval_CON_f1": 0.9803719008264462,
12
- "eval_CON_number": 972,
13
- "eval_CON_precision": 0.9844398340248963,
14
- "eval_CON_recall": 0.9763374485596708,
15
- "eval_FW_f1": 0.6382978723404255,
16
- "eval_FW_number": 28,
17
- "eval_FW_precision": 0.7894736842105263,
18
- "eval_FW_recall": 0.5357142857142857,
19
- "eval_INT_f1": 0.6909090909090909,
20
- "eval_INT_number": 26,
21
- "eval_INT_precision": 0.6551724137931034,
22
- "eval_INT_recall": 0.7307692307692307,
23
- "eval_NUM_f1": 0.9705882352941178,
24
- "eval_NUM_number": 239,
25
- "eval_NUM_precision": 0.9746835443037974,
26
- "eval_NUM_recall": 0.9665271966527197,
27
- "eval_N_PRP_f1": 0.9376979936642028,
28
- "eval_N_PRP_number": 470,
29
- "eval_N_PRP_precision": 0.9308176100628931,
30
- "eval_N_PRP_recall": 0.9446808510638298,
31
- "eval_N_V_f1": 0.9794437726723096,
32
- "eval_N_V_number": 416,
33
- "eval_N_V_precision": 0.9854014598540146,
34
- "eval_N_V_recall": 0.9735576923076923,
35
- "eval_N_f1": 0.965577669295281,
36
- "eval_N_number": 3992,
37
- "eval_N_precision": 0.9649737302977233,
38
- "eval_N_recall": 0.966182364729459,
39
- "eval_PRE_f1": 0.9673130193905818,
40
- "eval_PRE_number": 907,
41
- "eval_PRE_precision": 0.9721603563474388,
42
- "eval_PRE_recall": 0.9625137816979051,
43
- "eval_PRO_f1": 0.9340909090909091,
44
- "eval_PRO_number": 445,
45
- "eval_PRO_precision": 0.9448275862068966,
46
- "eval_PRO_recall": 0.9235955056179775,
47
- "eval_PUN_f1": 0.9996887643946467,
48
- "eval_PUN_number": 1607,
49
- "eval_PUN_precision": 1.0,
50
- "eval_PUN_recall": 0.9993777224642191,
51
- "eval_UNC_f1": 0.9333333333333333,
52
- "eval_UNC_number": 16,
53
- "eval_UNC_precision": 1.0,
54
- "eval_UNC_recall": 0.875,
55
- "eval_V_AUX_f1": 0.9780469341408025,
56
- "eval_V_AUX_number": 654,
57
- "eval_V_AUX_precision": 0.9685157421289355,
58
- "eval_V_AUX_recall": 0.9877675840978594,
59
- "eval_V_GER_f1": 0.9478764478764479,
60
- "eval_V_GER_number": 513,
61
- "eval_V_GER_precision": 0.9388145315487572,
62
- "eval_V_GER_recall": 0.9571150097465887,
63
- "eval_V_IMF_f1": 0.9564738292011019,
64
- "eval_V_IMF_number": 914,
65
- "eval_V_IMF_precision": 0.9633740288568258,
66
- "eval_V_IMF_recall": 0.949671772428884,
67
- "eval_V_IMV_f1": 0.796875,
68
- "eval_V_IMV_number": 70,
69
- "eval_V_IMV_precision": 0.8793103448275862,
70
- "eval_V_IMV_recall": 0.7285714285714285,
71
- "eval_V_PRF_f1": 0.902027027027027,
72
- "eval_V_PRF_number": 294,
73
- "eval_V_PRF_precision": 0.8959731543624161,
74
- "eval_V_PRF_recall": 0.9081632653061225,
75
- "eval_V_REL_f1": 0.9607451763140386,
76
- "eval_V_REL_number": 757,
77
- "eval_V_REL_precision": 0.967828418230563,
78
- "eval_V_REL_recall": 0.9537648612945839,
79
- "eval_V_f1": 0.9,
80
- "eval_V_number": 78,
81
- "eval_V_precision": 0.8780487804878049,
82
- "eval_V_recall": 0.9230769230769231,
83
- "eval_loss": 0.3193676769733429,
84
- "eval_overall_accuracy": 0.9561572292468389,
85
- "eval_overall_f1": 0.9561572292468388,
86
- "eval_overall_precision": 0.9561572292468389,
87
- "eval_overall_recall": 0.9561572292468389,
88
- "eval_runtime": 14.3338,
89
- "eval_samples": 929,
90
- "eval_samples_per_second": 64.812,
91
- "eval_steps_per_second": 2.093
92
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 10.0,
3
- "train_loss": 0.07197833191200252,
4
- "train_runtime": 2030.3618,
5
- "train_samples": 3691,
6
- "train_samples_per_second": 18.179,
7
- "train_steps_per_second": 2.275
8
- }
 
 
 
 
 
 
 
 
trainer_state.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
- "global_step": 4620,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 1.08,
12
- "learning_rate": 4.458874458874459e-05,
13
- "loss": 0.4026,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 2.16,
18
- "learning_rate": 3.917748917748918e-05,
19
- "loss": 0.1339,
20
- "step": 1000
21
- },
22
- {
23
- "epoch": 3.25,
24
- "learning_rate": 3.376623376623377e-05,
25
- "loss": 0.066,
26
- "step": 1500
27
- },
28
- {
29
- "epoch": 4.33,
30
- "learning_rate": 2.8354978354978357e-05,
31
- "loss": 0.032,
32
- "step": 2000
33
- },
34
- {
35
- "epoch": 5.41,
36
- "learning_rate": 2.2943722943722946e-05,
37
- "loss": 0.0157,
38
- "step": 2500
39
- },
40
- {
41
- "epoch": 6.49,
42
- "learning_rate": 1.7532467532467535e-05,
43
- "loss": 0.0061,
44
- "step": 3000
45
- },
46
- {
47
- "epoch": 7.58,
48
- "learning_rate": 1.2121212121212122e-05,
49
- "loss": 0.0051,
50
- "step": 3500
51
- },
52
- {
53
- "epoch": 8.66,
54
- "learning_rate": 6.709956709956711e-06,
55
- "loss": 0.002,
56
- "step": 4000
57
- },
58
- {
59
- "epoch": 9.74,
60
- "learning_rate": 1.2987012987012988e-06,
61
- "loss": 0.0015,
62
- "step": 4500
63
- },
64
- {
65
- "epoch": 10.0,
66
- "step": 4620,
67
- "total_flos": 2411508200294400.0,
68
- "train_loss": 0.07197833191200252,
69
- "train_runtime": 2030.3618,
70
- "train_samples_per_second": 18.179,
71
- "train_steps_per_second": 2.275
72
- }
73
- ],
74
- "max_steps": 4620,
75
- "num_train_epochs": 10,
76
- "total_flos": 2411508200294400.0,
77
- "trial_name": null,
78
- "trial_params": null
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd29656583d3cd9fb46c6b6b88fabde5a165aec3042edf54411bab3af0be3085
3
- size 2863