jorgeortizfuentes committed on
Commit
0b04e2c
1 Parent(s): 50ad54f

End of training

Browse files
all_results.json CHANGED
@@ -4,30 +4,30 @@
4
  "eval_NG_number": 3198,
5
  "eval_NG_precision": 0.7309048178613397,
6
  "eval_NG_recall": 0.7779862414008756,
7
- "eval_loss": 0.29878920316696167,
8
  "eval_overall_accuracy": 0.9019303173369988,
9
  "eval_overall_f1": 0.7537109966676764,
10
  "eval_overall_precision": 0.7309048178613397,
11
  "eval_overall_recall": 0.7779862414008756,
12
- "eval_runtime": 2.4235,
13
  "eval_samples": 391,
14
- "eval_samples_per_second": 161.337,
15
- "eval_steps_per_second": 10.316,
16
  "predict_NG_f1": 0.7636470935379168,
17
  "predict_NG_number": 3337,
18
  "predict_NG_precision": 0.7521069456553328,
19
  "predict_NG_recall": 0.7755468984117471,
20
- "predict_loss": 0.2863216698169708,
21
  "predict_overall_accuracy": 0.9084193245778611,
22
  "predict_overall_f1": 0.7636470935379168,
23
  "predict_overall_precision": 0.7521069456553328,
24
  "predict_overall_recall": 0.7755468984117471,
25
- "predict_runtime": 2.281,
26
- "predict_samples_per_second": 171.414,
27
- "predict_steps_per_second": 10.96,
28
- "train_loss": 0.23679824628328022,
29
- "train_runtime": 150.2286,
30
  "train_samples": 1824,
31
- "train_samples_per_second": 60.707,
32
- "train_steps_per_second": 3.794
33
  }
 
4
  "eval_NG_number": 3198,
5
  "eval_NG_precision": 0.7309048178613397,
6
  "eval_NG_recall": 0.7779862414008756,
7
+ "eval_loss": 0.29878926277160645,
8
  "eval_overall_accuracy": 0.9019303173369988,
9
  "eval_overall_f1": 0.7537109966676764,
10
  "eval_overall_precision": 0.7309048178613397,
11
  "eval_overall_recall": 0.7779862414008756,
12
+ "eval_runtime": 2.4602,
13
  "eval_samples": 391,
14
+ "eval_samples_per_second": 158.929,
15
+ "eval_steps_per_second": 10.162,
16
  "predict_NG_f1": 0.7636470935379168,
17
  "predict_NG_number": 3337,
18
  "predict_NG_precision": 0.7521069456553328,
19
  "predict_NG_recall": 0.7755468984117471,
20
+ "predict_loss": 0.28632164001464844,
21
  "predict_overall_accuracy": 0.9084193245778611,
22
  "predict_overall_f1": 0.7636470935379168,
23
  "predict_overall_precision": 0.7521069456553328,
24
  "predict_overall_recall": 0.7755468984117471,
25
+ "predict_runtime": 2.2477,
26
+ "predict_samples_per_second": 173.954,
27
+ "predict_steps_per_second": 11.122,
28
+ "train_loss": 0.23679824461016738,
29
+ "train_runtime": 149.9061,
30
  "train_samples": 1824,
31
+ "train_samples_per_second": 60.838,
32
+ "train_steps_per_second": 3.802
33
  }
eval_results.json CHANGED
@@ -4,13 +4,13 @@
4
  "eval_NG_number": 3198,
5
  "eval_NG_precision": 0.7309048178613397,
6
  "eval_NG_recall": 0.7779862414008756,
7
- "eval_loss": 0.29878920316696167,
8
  "eval_overall_accuracy": 0.9019303173369988,
9
  "eval_overall_f1": 0.7537109966676764,
10
  "eval_overall_precision": 0.7309048178613397,
11
  "eval_overall_recall": 0.7779862414008756,
12
- "eval_runtime": 2.4235,
13
  "eval_samples": 391,
14
- "eval_samples_per_second": 161.337,
15
- "eval_steps_per_second": 10.316
16
  }
 
4
  "eval_NG_number": 3198,
5
  "eval_NG_precision": 0.7309048178613397,
6
  "eval_NG_recall": 0.7779862414008756,
7
+ "eval_loss": 0.29878926277160645,
8
  "eval_overall_accuracy": 0.9019303173369988,
9
  "eval_overall_f1": 0.7537109966676764,
10
  "eval_overall_precision": 0.7309048178613397,
11
  "eval_overall_recall": 0.7779862414008756,
12
+ "eval_runtime": 2.4602,
13
  "eval_samples": 391,
14
+ "eval_samples_per_second": 158.929,
15
+ "eval_steps_per_second": 10.162
16
  }
predict_results.json CHANGED
@@ -3,12 +3,12 @@
3
  "predict_NG_number": 3337,
4
  "predict_NG_precision": 0.7521069456553328,
5
  "predict_NG_recall": 0.7755468984117471,
6
- "predict_loss": 0.2863216698169708,
7
  "predict_overall_accuracy": 0.9084193245778611,
8
  "predict_overall_f1": 0.7636470935379168,
9
  "predict_overall_precision": 0.7521069456553328,
10
  "predict_overall_recall": 0.7755468984117471,
11
- "predict_runtime": 2.281,
12
- "predict_samples_per_second": 171.414,
13
- "predict_steps_per_second": 10.96
14
  }
 
3
  "predict_NG_number": 3337,
4
  "predict_NG_precision": 0.7521069456553328,
5
  "predict_NG_recall": 0.7755468984117471,
6
+ "predict_loss": 0.28632164001464844,
7
  "predict_overall_accuracy": 0.9084193245778611,
8
  "predict_overall_f1": 0.7636470935379168,
9
  "predict_overall_precision": 0.7521069456553328,
10
  "predict_overall_recall": 0.7755468984117471,
11
+ "predict_runtime": 2.2477,
12
+ "predict_samples_per_second": 173.954,
13
+ "predict_steps_per_second": 11.122
14
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.23679824628328022,
4
- "train_runtime": 150.2286,
5
  "train_samples": 1824,
6
- "train_samples_per_second": 60.707,
7
- "train_steps_per_second": 3.794
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.23679824461016738,
4
+ "train_runtime": 149.9061,
5
  "train_samples": 1824,
6
+ "train_samples_per_second": 60.838,
7
+ "train_steps_per_second": 3.802
8
  }
trainer_state.json CHANGED
@@ -24,9 +24,9 @@
24
  "eval_overall_f1": 0.7225241545893719,
25
  "eval_overall_precision": 0.698482194979568,
26
  "eval_overall_recall": 0.7482801751094434,
27
- "eval_runtime": 2.2675,
28
- "eval_samples_per_second": 172.436,
29
- "eval_steps_per_second": 11.025,
30
  "step": 114
31
  },
32
  {
@@ -41,14 +41,14 @@
41
  "eval_NG_number": 3198,
42
  "eval_NG_precision": 0.7293508076805851,
43
  "eval_NG_recall": 0.7482801751094434,
44
- "eval_loss": 0.29169175028800964,
45
  "eval_overall_accuracy": 0.8932050439251777,
46
  "eval_overall_f1": 0.7386942429387251,
47
  "eval_overall_precision": 0.7293508076805851,
48
  "eval_overall_recall": 0.7482801751094434,
49
- "eval_runtime": 2.3333,
50
- "eval_samples_per_second": 167.577,
51
- "eval_steps_per_second": 10.715,
52
  "step": 228
53
  },
54
  {
@@ -63,14 +63,14 @@
63
  "eval_NG_number": 3198,
64
  "eval_NG_precision": 0.7306327616794795,
65
  "eval_NG_recall": 0.7726704190118824,
66
- "eval_loss": 0.2864079773426056,
67
  "eval_overall_accuracy": 0.9000179286439969,
68
  "eval_overall_f1": 0.751063829787234,
69
  "eval_overall_precision": 0.7306327616794795,
70
  "eval_overall_recall": 0.7726704190118824,
71
- "eval_runtime": 2.3686,
72
- "eval_samples_per_second": 165.074,
73
- "eval_steps_per_second": 10.555,
74
  "step": 342
75
  },
76
  {
@@ -85,14 +85,14 @@
85
  "eval_NG_number": 3198,
86
  "eval_NG_precision": 0.7309048178613397,
87
  "eval_NG_recall": 0.7779862414008756,
88
- "eval_loss": 0.29878920316696167,
89
  "eval_overall_accuracy": 0.9019303173369988,
90
  "eval_overall_f1": 0.7537109966676764,
91
  "eval_overall_precision": 0.7309048178613397,
92
  "eval_overall_recall": 0.7779862414008756,
93
- "eval_runtime": 2.3061,
94
- "eval_samples_per_second": 169.554,
95
- "eval_steps_per_second": 10.841,
96
  "step": 456
97
  },
98
  {
@@ -112,19 +112,19 @@
112
  "eval_overall_f1": 0.7514363471424251,
113
  "eval_overall_precision": 0.7274590163934426,
114
  "eval_overall_recall": 0.7770481550969356,
115
- "eval_runtime": 2.3108,
116
- "eval_samples_per_second": 169.206,
117
- "eval_steps_per_second": 10.819,
118
  "step": 570
119
  },
120
  {
121
  "epoch": 5.0,
122
  "step": 570,
123
  "total_flos": 2383047966228480.0,
124
- "train_loss": 0.23679824628328022,
125
- "train_runtime": 150.2286,
126
- "train_samples_per_second": 60.707,
127
- "train_steps_per_second": 3.794
128
  }
129
  ],
130
  "max_steps": 570,
 
24
  "eval_overall_f1": 0.7225241545893719,
25
  "eval_overall_precision": 0.698482194979568,
26
  "eval_overall_recall": 0.7482801751094434,
27
+ "eval_runtime": 2.2533,
28
+ "eval_samples_per_second": 173.524,
29
+ "eval_steps_per_second": 11.095,
30
  "step": 114
31
  },
32
  {
 
41
  "eval_NG_number": 3198,
42
  "eval_NG_precision": 0.7293508076805851,
43
  "eval_NG_recall": 0.7482801751094434,
44
+ "eval_loss": 0.29169172048568726,
45
  "eval_overall_accuracy": 0.8932050439251777,
46
  "eval_overall_f1": 0.7386942429387251,
47
  "eval_overall_precision": 0.7293508076805851,
48
  "eval_overall_recall": 0.7482801751094434,
49
+ "eval_runtime": 2.3222,
50
+ "eval_samples_per_second": 168.377,
51
+ "eval_steps_per_second": 10.766,
52
  "step": 228
53
  },
54
  {
 
63
  "eval_NG_number": 3198,
64
  "eval_NG_precision": 0.7306327616794795,
65
  "eval_NG_recall": 0.7726704190118824,
66
+ "eval_loss": 0.286408007144928,
67
  "eval_overall_accuracy": 0.9000179286439969,
68
  "eval_overall_f1": 0.751063829787234,
69
  "eval_overall_precision": 0.7306327616794795,
70
  "eval_overall_recall": 0.7726704190118824,
71
+ "eval_runtime": 2.3542,
72
+ "eval_samples_per_second": 166.089,
73
+ "eval_steps_per_second": 10.62,
74
  "step": 342
75
  },
76
  {
 
85
  "eval_NG_number": 3198,
86
  "eval_NG_precision": 0.7309048178613397,
87
  "eval_NG_recall": 0.7779862414008756,
88
+ "eval_loss": 0.29878926277160645,
89
  "eval_overall_accuracy": 0.9019303173369988,
90
  "eval_overall_f1": 0.7537109966676764,
91
  "eval_overall_precision": 0.7309048178613397,
92
  "eval_overall_recall": 0.7779862414008756,
93
+ "eval_runtime": 2.2946,
94
+ "eval_samples_per_second": 170.401,
95
+ "eval_steps_per_second": 10.895,
96
  "step": 456
97
  },
98
  {
 
112
  "eval_overall_f1": 0.7514363471424251,
113
  "eval_overall_precision": 0.7274590163934426,
114
  "eval_overall_recall": 0.7770481550969356,
115
+ "eval_runtime": 2.2998,
116
+ "eval_samples_per_second": 170.014,
117
+ "eval_steps_per_second": 10.87,
118
  "step": 570
119
  },
120
  {
121
  "epoch": 5.0,
122
  "step": 570,
123
  "total_flos": 2383047966228480.0,
124
+ "train_loss": 0.23679824461016738,
125
+ "train_runtime": 149.9061,
126
+ "train_samples_per_second": 60.838,
127
+ "train_steps_per_second": 3.802
128
  }
129
  ],
130
  "max_steps": 570,