Commit
•
0b04e2c
1
Parent(s):
50ad54f
End of training
Browse files- all_results.json +12 -12
- eval_results.json +4 -4
- predict_results.json +4 -4
- train_results.json +4 -4
- trainer_state.json +22 -22
all_results.json
CHANGED
@@ -4,30 +4,30 @@
|
|
4 |
"eval_NG_number": 3198,
|
5 |
"eval_NG_precision": 0.7309048178613397,
|
6 |
"eval_NG_recall": 0.7779862414008756,
|
7 |
-
"eval_loss": 0.
|
8 |
"eval_overall_accuracy": 0.9019303173369988,
|
9 |
"eval_overall_f1": 0.7537109966676764,
|
10 |
"eval_overall_precision": 0.7309048178613397,
|
11 |
"eval_overall_recall": 0.7779862414008756,
|
12 |
-
"eval_runtime": 2.
|
13 |
"eval_samples": 391,
|
14 |
-
"eval_samples_per_second":
|
15 |
-
"eval_steps_per_second": 10.
|
16 |
"predict_NG_f1": 0.7636470935379168,
|
17 |
"predict_NG_number": 3337,
|
18 |
"predict_NG_precision": 0.7521069456553328,
|
19 |
"predict_NG_recall": 0.7755468984117471,
|
20 |
-
"predict_loss": 0.
|
21 |
"predict_overall_accuracy": 0.9084193245778611,
|
22 |
"predict_overall_f1": 0.7636470935379168,
|
23 |
"predict_overall_precision": 0.7521069456553328,
|
24 |
"predict_overall_recall": 0.7755468984117471,
|
25 |
-
"predict_runtime": 2.
|
26 |
-
"predict_samples_per_second":
|
27 |
-
"predict_steps_per_second":
|
28 |
-
"train_loss": 0.
|
29 |
-
"train_runtime":
|
30 |
"train_samples": 1824,
|
31 |
-
"train_samples_per_second": 60.
|
32 |
-
"train_steps_per_second": 3.
|
33 |
}
|
|
|
4 |
"eval_NG_number": 3198,
|
5 |
"eval_NG_precision": 0.7309048178613397,
|
6 |
"eval_NG_recall": 0.7779862414008756,
|
7 |
+
"eval_loss": 0.29878926277160645,
|
8 |
"eval_overall_accuracy": 0.9019303173369988,
|
9 |
"eval_overall_f1": 0.7537109966676764,
|
10 |
"eval_overall_precision": 0.7309048178613397,
|
11 |
"eval_overall_recall": 0.7779862414008756,
|
12 |
+
"eval_runtime": 2.4602,
|
13 |
"eval_samples": 391,
|
14 |
+
"eval_samples_per_second": 158.929,
|
15 |
+
"eval_steps_per_second": 10.162,
|
16 |
"predict_NG_f1": 0.7636470935379168,
|
17 |
"predict_NG_number": 3337,
|
18 |
"predict_NG_precision": 0.7521069456553328,
|
19 |
"predict_NG_recall": 0.7755468984117471,
|
20 |
+
"predict_loss": 0.28632164001464844,
|
21 |
"predict_overall_accuracy": 0.9084193245778611,
|
22 |
"predict_overall_f1": 0.7636470935379168,
|
23 |
"predict_overall_precision": 0.7521069456553328,
|
24 |
"predict_overall_recall": 0.7755468984117471,
|
25 |
+
"predict_runtime": 2.2477,
|
26 |
+
"predict_samples_per_second": 173.954,
|
27 |
+
"predict_steps_per_second": 11.122,
|
28 |
+
"train_loss": 0.23679824461016738,
|
29 |
+
"train_runtime": 149.9061,
|
30 |
"train_samples": 1824,
|
31 |
+
"train_samples_per_second": 60.838,
|
32 |
+
"train_steps_per_second": 3.802
|
33 |
}
|
eval_results.json
CHANGED
@@ -4,13 +4,13 @@
|
|
4 |
"eval_NG_number": 3198,
|
5 |
"eval_NG_precision": 0.7309048178613397,
|
6 |
"eval_NG_recall": 0.7779862414008756,
|
7 |
-
"eval_loss": 0.
|
8 |
"eval_overall_accuracy": 0.9019303173369988,
|
9 |
"eval_overall_f1": 0.7537109966676764,
|
10 |
"eval_overall_precision": 0.7309048178613397,
|
11 |
"eval_overall_recall": 0.7779862414008756,
|
12 |
-
"eval_runtime": 2.
|
13 |
"eval_samples": 391,
|
14 |
-
"eval_samples_per_second":
|
15 |
-
"eval_steps_per_second": 10.
|
16 |
}
|
|
|
4 |
"eval_NG_number": 3198,
|
5 |
"eval_NG_precision": 0.7309048178613397,
|
6 |
"eval_NG_recall": 0.7779862414008756,
|
7 |
+
"eval_loss": 0.29878926277160645,
|
8 |
"eval_overall_accuracy": 0.9019303173369988,
|
9 |
"eval_overall_f1": 0.7537109966676764,
|
10 |
"eval_overall_precision": 0.7309048178613397,
|
11 |
"eval_overall_recall": 0.7779862414008756,
|
12 |
+
"eval_runtime": 2.4602,
|
13 |
"eval_samples": 391,
|
14 |
+
"eval_samples_per_second": 158.929,
|
15 |
+
"eval_steps_per_second": 10.162
|
16 |
}
|
predict_results.json
CHANGED
@@ -3,12 +3,12 @@
|
|
3 |
"predict_NG_number": 3337,
|
4 |
"predict_NG_precision": 0.7521069456553328,
|
5 |
"predict_NG_recall": 0.7755468984117471,
|
6 |
-
"predict_loss": 0.
|
7 |
"predict_overall_accuracy": 0.9084193245778611,
|
8 |
"predict_overall_f1": 0.7636470935379168,
|
9 |
"predict_overall_precision": 0.7521069456553328,
|
10 |
"predict_overall_recall": 0.7755468984117471,
|
11 |
-
"predict_runtime": 2.
|
12 |
-
"predict_samples_per_second":
|
13 |
-
"predict_steps_per_second":
|
14 |
}
|
|
|
3 |
"predict_NG_number": 3337,
|
4 |
"predict_NG_precision": 0.7521069456553328,
|
5 |
"predict_NG_recall": 0.7755468984117471,
|
6 |
+
"predict_loss": 0.28632164001464844,
|
7 |
"predict_overall_accuracy": 0.9084193245778611,
|
8 |
"predict_overall_f1": 0.7636470935379168,
|
9 |
"predict_overall_precision": 0.7521069456553328,
|
10 |
"predict_overall_recall": 0.7755468984117471,
|
11 |
+
"predict_runtime": 2.2477,
|
12 |
+
"predict_samples_per_second": 173.954,
|
13 |
+
"predict_steps_per_second": 11.122
|
14 |
}
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 1824,
|
6 |
-
"train_samples_per_second": 60.
|
7 |
-
"train_steps_per_second": 3.
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
+
"train_loss": 0.23679824461016738,
|
4 |
+
"train_runtime": 149.9061,
|
5 |
"train_samples": 1824,
|
6 |
+
"train_samples_per_second": 60.838,
|
7 |
+
"train_steps_per_second": 3.802
|
8 |
}
|
trainer_state.json
CHANGED
@@ -24,9 +24,9 @@
|
|
24 |
"eval_overall_f1": 0.7225241545893719,
|
25 |
"eval_overall_precision": 0.698482194979568,
|
26 |
"eval_overall_recall": 0.7482801751094434,
|
27 |
-
"eval_runtime": 2.
|
28 |
-
"eval_samples_per_second":
|
29 |
-
"eval_steps_per_second": 11.
|
30 |
"step": 114
|
31 |
},
|
32 |
{
|
@@ -41,14 +41,14 @@
|
|
41 |
"eval_NG_number": 3198,
|
42 |
"eval_NG_precision": 0.7293508076805851,
|
43 |
"eval_NG_recall": 0.7482801751094434,
|
44 |
-
"eval_loss": 0.
|
45 |
"eval_overall_accuracy": 0.8932050439251777,
|
46 |
"eval_overall_f1": 0.7386942429387251,
|
47 |
"eval_overall_precision": 0.7293508076805851,
|
48 |
"eval_overall_recall": 0.7482801751094434,
|
49 |
-
"eval_runtime": 2.
|
50 |
-
"eval_samples_per_second":
|
51 |
-
"eval_steps_per_second": 10.
|
52 |
"step": 228
|
53 |
},
|
54 |
{
|
@@ -63,14 +63,14 @@
|
|
63 |
"eval_NG_number": 3198,
|
64 |
"eval_NG_precision": 0.7306327616794795,
|
65 |
"eval_NG_recall": 0.7726704190118824,
|
66 |
-
"eval_loss": 0.
|
67 |
"eval_overall_accuracy": 0.9000179286439969,
|
68 |
"eval_overall_f1": 0.751063829787234,
|
69 |
"eval_overall_precision": 0.7306327616794795,
|
70 |
"eval_overall_recall": 0.7726704190118824,
|
71 |
-
"eval_runtime": 2.
|
72 |
-
"eval_samples_per_second":
|
73 |
-
"eval_steps_per_second": 10.
|
74 |
"step": 342
|
75 |
},
|
76 |
{
|
@@ -85,14 +85,14 @@
|
|
85 |
"eval_NG_number": 3198,
|
86 |
"eval_NG_precision": 0.7309048178613397,
|
87 |
"eval_NG_recall": 0.7779862414008756,
|
88 |
-
"eval_loss": 0.
|
89 |
"eval_overall_accuracy": 0.9019303173369988,
|
90 |
"eval_overall_f1": 0.7537109966676764,
|
91 |
"eval_overall_precision": 0.7309048178613397,
|
92 |
"eval_overall_recall": 0.7779862414008756,
|
93 |
-
"eval_runtime": 2.
|
94 |
-
"eval_samples_per_second":
|
95 |
-
"eval_steps_per_second": 10.
|
96 |
"step": 456
|
97 |
},
|
98 |
{
|
@@ -112,19 +112,19 @@
|
|
112 |
"eval_overall_f1": 0.7514363471424251,
|
113 |
"eval_overall_precision": 0.7274590163934426,
|
114 |
"eval_overall_recall": 0.7770481550969356,
|
115 |
-
"eval_runtime": 2.
|
116 |
-
"eval_samples_per_second":
|
117 |
-
"eval_steps_per_second": 10.
|
118 |
"step": 570
|
119 |
},
|
120 |
{
|
121 |
"epoch": 5.0,
|
122 |
"step": 570,
|
123 |
"total_flos": 2383047966228480.0,
|
124 |
-
"train_loss": 0.
|
125 |
-
"train_runtime":
|
126 |
-
"train_samples_per_second": 60.
|
127 |
-
"train_steps_per_second": 3.
|
128 |
}
|
129 |
],
|
130 |
"max_steps": 570,
|
|
|
24 |
"eval_overall_f1": 0.7225241545893719,
|
25 |
"eval_overall_precision": 0.698482194979568,
|
26 |
"eval_overall_recall": 0.7482801751094434,
|
27 |
+
"eval_runtime": 2.2533,
|
28 |
+
"eval_samples_per_second": 173.524,
|
29 |
+
"eval_steps_per_second": 11.095,
|
30 |
"step": 114
|
31 |
},
|
32 |
{
|
|
|
41 |
"eval_NG_number": 3198,
|
42 |
"eval_NG_precision": 0.7293508076805851,
|
43 |
"eval_NG_recall": 0.7482801751094434,
|
44 |
+
"eval_loss": 0.29169172048568726,
|
45 |
"eval_overall_accuracy": 0.8932050439251777,
|
46 |
"eval_overall_f1": 0.7386942429387251,
|
47 |
"eval_overall_precision": 0.7293508076805851,
|
48 |
"eval_overall_recall": 0.7482801751094434,
|
49 |
+
"eval_runtime": 2.3222,
|
50 |
+
"eval_samples_per_second": 168.377,
|
51 |
+
"eval_steps_per_second": 10.766,
|
52 |
"step": 228
|
53 |
},
|
54 |
{
|
|
|
63 |
"eval_NG_number": 3198,
|
64 |
"eval_NG_precision": 0.7306327616794795,
|
65 |
"eval_NG_recall": 0.7726704190118824,
|
66 |
+
"eval_loss": 0.286408007144928,
|
67 |
"eval_overall_accuracy": 0.9000179286439969,
|
68 |
"eval_overall_f1": 0.751063829787234,
|
69 |
"eval_overall_precision": 0.7306327616794795,
|
70 |
"eval_overall_recall": 0.7726704190118824,
|
71 |
+
"eval_runtime": 2.3542,
|
72 |
+
"eval_samples_per_second": 166.089,
|
73 |
+
"eval_steps_per_second": 10.62,
|
74 |
"step": 342
|
75 |
},
|
76 |
{
|
|
|
85 |
"eval_NG_number": 3198,
|
86 |
"eval_NG_precision": 0.7309048178613397,
|
87 |
"eval_NG_recall": 0.7779862414008756,
|
88 |
+
"eval_loss": 0.29878926277160645,
|
89 |
"eval_overall_accuracy": 0.9019303173369988,
|
90 |
"eval_overall_f1": 0.7537109966676764,
|
91 |
"eval_overall_precision": 0.7309048178613397,
|
92 |
"eval_overall_recall": 0.7779862414008756,
|
93 |
+
"eval_runtime": 2.2946,
|
94 |
+
"eval_samples_per_second": 170.401,
|
95 |
+
"eval_steps_per_second": 10.895,
|
96 |
"step": 456
|
97 |
},
|
98 |
{
|
|
|
112 |
"eval_overall_f1": 0.7514363471424251,
|
113 |
"eval_overall_precision": 0.7274590163934426,
|
114 |
"eval_overall_recall": 0.7770481550969356,
|
115 |
+
"eval_runtime": 2.2998,
|
116 |
+
"eval_samples_per_second": 170.014,
|
117 |
+
"eval_steps_per_second": 10.87,
|
118 |
"step": 570
|
119 |
},
|
120 |
{
|
121 |
"epoch": 5.0,
|
122 |
"step": 570,
|
123 |
"total_flos": 2383047966228480.0,
|
124 |
+
"train_loss": 0.23679824461016738,
|
125 |
+
"train_runtime": 149.9061,
|
126 |
+
"train_samples_per_second": 60.838,
|
127 |
+
"train_steps_per_second": 3.802
|
128 |
}
|
129 |
],
|
130 |
"max_steps": 570,
|