apwic commited on
Commit
9a8567c
1 Parent(s): eb8be17

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -6,16 +6,16 @@
6
  "eval_loss": 0.33090195059776306,
7
  "eval_precision": 0.8378262413446174,
8
  "eval_recall": 0.8460174577195854,
9
- "eval_runtime": 4.9693,
10
  "eval_samples": 399,
11
- "eval_samples_per_second": 80.292,
12
- "eval_steps_per_second": 10.062,
13
  "f1": 0.8418232002914281,
14
  "precision": 0.8393060770407454,
15
  "recall": 0.8445056806950497,
16
  "train_loss": 0.3206107397548488,
17
- "train_runtime": 1955.0616,
18
  "train_samples": 3638,
19
- "train_samples_per_second": 37.216,
20
- "train_steps_per_second": 1.248
21
  }
 
6
  "eval_loss": 0.33090195059776306,
7
  "eval_precision": 0.8378262413446174,
8
  "eval_recall": 0.8460174577195854,
9
+ "eval_runtime": 5.0536,
10
  "eval_samples": 399,
11
+ "eval_samples_per_second": 78.954,
12
+ "eval_steps_per_second": 9.894,
13
  "f1": 0.8418232002914281,
14
  "precision": 0.8393060770407454,
15
  "recall": 0.8445056806950497,
16
  "train_loss": 0.3206107397548488,
17
+ "train_runtime": 1953.692,
18
  "train_samples": 3638,
19
+ "train_samples_per_second": 37.242,
20
+ "train_steps_per_second": 1.249
21
  }
eval_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_loss": 0.33090195059776306,
6
  "eval_precision": 0.8378262413446174,
7
  "eval_recall": 0.8460174577195854,
8
- "eval_runtime": 4.9693,
9
  "eval_samples": 399,
10
- "eval_samples_per_second": 80.292,
11
- "eval_steps_per_second": 10.062
12
  }
 
5
  "eval_loss": 0.33090195059776306,
6
  "eval_precision": 0.8378262413446174,
7
  "eval_recall": 0.8460174577195854,
8
+ "eval_runtime": 5.0536,
9
  "eval_samples": 399,
10
+ "eval_samples_per_second": 78.954,
11
+ "eval_steps_per_second": 9.894
12
  }
predict_results.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.8674579624134521,
3
+ "f1": 0.8418232002914281,
4
+ "precision": 0.8393060770407454,
5
+ "recall": 0.8445056806950497
6
+ }
runs/May26_13-14-11_indolem-petl-vm/events.out.tfevents.1716731222.indolem-petl-vm.2896391.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a899746a082c64a16bb00bec531f4dbe332e9aaf00709dd6e7ae90c559a2b03
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.3206107397548488,
4
- "train_runtime": 1955.0616,
5
  "train_samples": 3638,
6
- "train_samples_per_second": 37.216,
7
- "train_steps_per_second": 1.248
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.3206107397548488,
4
+ "train_runtime": 1953.692,
5
  "train_samples": 3638,
6
+ "train_samples_per_second": 37.242,
7
+ "train_steps_per_second": 1.249
8
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_loss": 0.5075693130493164,
23
  "eval_precision": 0.6564625850340136,
24
  "eval_recall": 0.6463902527732315,
25
- "eval_runtime": 5.145,
26
- "eval_samples_per_second": 77.551,
27
- "eval_steps_per_second": 9.718,
28
  "step": 122
29
  },
30
  {
@@ -41,9 +41,9 @@
41
  "eval_loss": 0.48389074206352234,
42
  "eval_precision": 0.7106679035250464,
43
  "eval_recall": 0.7409074377159484,
44
- "eval_runtime": 5.0628,
45
- "eval_samples_per_second": 78.81,
46
- "eval_steps_per_second": 9.876,
47
  "step": 244
48
  },
49
  {
@@ -60,9 +60,9 @@
60
  "eval_loss": 0.425637811422348,
61
  "eval_precision": 0.7280813755532857,
62
  "eval_recall": 0.7436352064011639,
63
- "eval_runtime": 5.0694,
64
- "eval_samples_per_second": 78.708,
65
- "eval_steps_per_second": 9.863,
66
  "step": 366
67
  },
68
  {
@@ -79,9 +79,9 @@
79
  "eval_loss": 0.387967973947525,
80
  "eval_precision": 0.7798245614035089,
81
  "eval_recall": 0.7755501000181851,
82
- "eval_runtime": 5.0609,
83
- "eval_samples_per_second": 78.84,
84
- "eval_steps_per_second": 9.88,
85
  "step": 488
86
  },
87
  {
@@ -98,9 +98,9 @@
98
  "eval_loss": 0.4130999743938446,
99
  "eval_precision": 0.765661378526179,
100
  "eval_recall": 0.7974177123113293,
101
- "eval_runtime": 5.1051,
102
- "eval_samples_per_second": 78.158,
103
- "eval_steps_per_second": 9.794,
104
  "step": 610
105
  },
106
  {
@@ -117,9 +117,9 @@
117
  "eval_loss": 0.36453139781951904,
118
  "eval_precision": 0.7965023376930815,
119
  "eval_recall": 0.803691580287325,
120
- "eval_runtime": 5.0825,
121
- "eval_samples_per_second": 78.504,
122
- "eval_steps_per_second": 9.838,
123
  "step": 732
124
  },
125
  {
@@ -136,9 +136,9 @@
136
  "eval_loss": 0.3639658987522125,
137
  "eval_precision": 0.798820781588242,
138
  "eval_recall": 0.8179669030732861,
139
- "eval_runtime": 5.0648,
140
- "eval_samples_per_second": 78.779,
141
- "eval_steps_per_second": 9.872,
142
  "step": 854
143
  },
144
  {
@@ -155,9 +155,9 @@
155
  "eval_loss": 0.3551309108734131,
156
  "eval_precision": 0.7996165051429931,
157
  "eval_recall": 0.8054646299327151,
158
- "eval_runtime": 5.1012,
159
- "eval_samples_per_second": 78.216,
160
- "eval_steps_per_second": 9.802,
161
  "step": 976
162
  },
163
  {
@@ -174,9 +174,9 @@
174
  "eval_loss": 0.3508576452732086,
175
  "eval_precision": 0.8169406150583245,
176
  "eval_recall": 0.8261047463175123,
177
- "eval_runtime": 5.0536,
178
- "eval_samples_per_second": 78.953,
179
- "eval_steps_per_second": 9.894,
180
  "step": 1098
181
  },
182
  {
@@ -193,9 +193,9 @@
193
  "eval_loss": 0.341298907995224,
194
  "eval_precision": 0.8212799324446589,
195
  "eval_recall": 0.8228768867066739,
196
- "eval_runtime": 5.0649,
197
- "eval_samples_per_second": 78.778,
198
- "eval_steps_per_second": 9.872,
199
  "step": 1220
200
  },
201
  {
@@ -212,9 +212,9 @@
212
  "eval_loss": 0.3493994474411011,
213
  "eval_precision": 0.8192918192918193,
214
  "eval_recall": 0.8328787052191308,
215
- "eval_runtime": 5.0474,
216
- "eval_samples_per_second": 79.051,
217
- "eval_steps_per_second": 9.906,
218
  "step": 1342
219
  },
220
  {
@@ -231,9 +231,9 @@
231
  "eval_loss": 0.35203850269317627,
232
  "eval_precision": 0.822024085224641,
233
  "eval_recall": 0.837152209492635,
234
- "eval_runtime": 5.0872,
235
- "eval_samples_per_second": 78.432,
236
- "eval_steps_per_second": 9.829,
237
  "step": 1464
238
  },
239
  {
@@ -250,9 +250,9 @@
250
  "eval_loss": 0.33577361702919006,
251
  "eval_precision": 0.8201621387462095,
252
  "eval_recall": 0.8136024731769412,
253
- "eval_runtime": 5.0577,
254
- "eval_samples_per_second": 78.89,
255
- "eval_steps_per_second": 9.886,
256
  "step": 1586
257
  },
258
  {
@@ -269,9 +269,9 @@
269
  "eval_loss": 0.3354940712451935,
270
  "eval_precision": 0.8352012604792199,
271
  "eval_recall": 0.8417439534460811,
272
- "eval_runtime": 5.0671,
273
- "eval_samples_per_second": 78.744,
274
- "eval_steps_per_second": 9.868,
275
  "step": 1708
276
  },
277
  {
@@ -288,9 +288,9 @@
288
  "eval_loss": 0.3406221270561218,
289
  "eval_precision": 0.8345705196182396,
290
  "eval_recall": 0.8442444080741953,
291
- "eval_runtime": 5.0556,
292
- "eval_samples_per_second": 78.923,
293
- "eval_steps_per_second": 9.89,
294
  "step": 1830
295
  },
296
  {
@@ -307,9 +307,9 @@
307
  "eval_loss": 0.337022989988327,
308
  "eval_precision": 0.8308913308913308,
309
  "eval_recall": 0.8449718130569195,
310
- "eval_runtime": 5.0566,
311
- "eval_samples_per_second": 78.906,
312
- "eval_steps_per_second": 9.888,
313
  "step": 1952
314
  },
315
  {
@@ -326,9 +326,9 @@
326
  "eval_loss": 0.3271777033805847,
327
  "eval_precision": 0.8411320530352577,
328
  "eval_recall": 0.8477905073649754,
329
- "eval_runtime": 5.0845,
330
- "eval_samples_per_second": 78.474,
331
- "eval_steps_per_second": 9.834,
332
  "step": 2074
333
  },
334
  {
@@ -345,9 +345,9 @@
345
  "eval_loss": 0.3318663537502289,
346
  "eval_precision": 0.8313636363636363,
347
  "eval_recall": 0.8424713584288053,
348
- "eval_runtime": 5.0547,
349
- "eval_samples_per_second": 78.936,
350
- "eval_steps_per_second": 9.892,
351
  "step": 2196
352
  },
353
  {
@@ -364,9 +364,9 @@
364
  "eval_loss": 0.3293265402317047,
365
  "eval_precision": 0.8411320530352577,
366
  "eval_recall": 0.8477905073649754,
367
- "eval_runtime": 5.0713,
368
- "eval_samples_per_second": 78.678,
369
- "eval_steps_per_second": 9.859,
370
  "step": 2318
371
  },
372
  {
@@ -383,9 +383,9 @@
383
  "eval_loss": 0.33090195059776306,
384
  "eval_precision": 0.8378262413446174,
385
  "eval_recall": 0.8460174577195854,
386
- "eval_runtime": 5.0518,
387
- "eval_samples_per_second": 78.981,
388
- "eval_steps_per_second": 9.897,
389
  "step": 2440
390
  },
391
  {
@@ -393,9 +393,9 @@
393
  "step": 2440,
394
  "total_flos": 7609911792720000.0,
395
  "train_loss": 0.3206107397548488,
396
- "train_runtime": 1955.0616,
397
- "train_samples_per_second": 37.216,
398
- "train_steps_per_second": 1.248
399
  }
400
  ],
401
  "logging_steps": 500,
 
22
  "eval_loss": 0.5075693130493164,
23
  "eval_precision": 0.6564625850340136,
24
  "eval_recall": 0.6463902527732315,
25
+ "eval_runtime": 5.0923,
26
+ "eval_samples_per_second": 78.354,
27
+ "eval_steps_per_second": 9.819,
28
  "step": 122
29
  },
30
  {
 
41
  "eval_loss": 0.48389074206352234,
42
  "eval_precision": 0.7106679035250464,
43
  "eval_recall": 0.7409074377159484,
44
+ "eval_runtime": 5.0441,
45
+ "eval_samples_per_second": 79.102,
46
+ "eval_steps_per_second": 9.913,
47
  "step": 244
48
  },
49
  {
 
60
  "eval_loss": 0.425637811422348,
61
  "eval_precision": 0.7280813755532857,
62
  "eval_recall": 0.7436352064011639,
63
+ "eval_runtime": 5.0729,
64
+ "eval_samples_per_second": 78.653,
65
+ "eval_steps_per_second": 9.856,
66
  "step": 366
67
  },
68
  {
 
79
  "eval_loss": 0.387967973947525,
80
  "eval_precision": 0.7798245614035089,
81
  "eval_recall": 0.7755501000181851,
82
+ "eval_runtime": 5.0882,
83
+ "eval_samples_per_second": 78.417,
84
+ "eval_steps_per_second": 9.827,
85
  "step": 488
86
  },
87
  {
 
98
  "eval_loss": 0.4130999743938446,
99
  "eval_precision": 0.765661378526179,
100
  "eval_recall": 0.7974177123113293,
101
+ "eval_runtime": 5.0804,
102
+ "eval_samples_per_second": 78.538,
103
+ "eval_steps_per_second": 9.842,
104
  "step": 610
105
  },
106
  {
 
117
  "eval_loss": 0.36453139781951904,
118
  "eval_precision": 0.7965023376930815,
119
  "eval_recall": 0.803691580287325,
120
+ "eval_runtime": 5.1163,
121
+ "eval_samples_per_second": 77.986,
122
+ "eval_steps_per_second": 9.773,
123
  "step": 732
124
  },
125
  {
 
136
  "eval_loss": 0.3639658987522125,
137
  "eval_precision": 0.798820781588242,
138
  "eval_recall": 0.8179669030732861,
139
+ "eval_runtime": 5.0581,
140
+ "eval_samples_per_second": 78.884,
141
+ "eval_steps_per_second": 9.885,
142
  "step": 854
143
  },
144
  {
 
155
  "eval_loss": 0.3551309108734131,
156
  "eval_precision": 0.7996165051429931,
157
  "eval_recall": 0.8054646299327151,
158
+ "eval_runtime": 5.0639,
159
+ "eval_samples_per_second": 78.794,
160
+ "eval_steps_per_second": 9.874,
161
  "step": 976
162
  },
163
  {
 
174
  "eval_loss": 0.3508576452732086,
175
  "eval_precision": 0.8169406150583245,
176
  "eval_recall": 0.8261047463175123,
177
+ "eval_runtime": 5.0524,
178
+ "eval_samples_per_second": 78.973,
179
+ "eval_steps_per_second": 9.896,
180
  "step": 1098
181
  },
182
  {
 
193
  "eval_loss": 0.341298907995224,
194
  "eval_precision": 0.8212799324446589,
195
  "eval_recall": 0.8228768867066739,
196
+ "eval_runtime": 5.0711,
197
+ "eval_samples_per_second": 78.681,
198
+ "eval_steps_per_second": 9.86,
199
  "step": 1220
200
  },
201
  {
 
212
  "eval_loss": 0.3493994474411011,
213
  "eval_precision": 0.8192918192918193,
214
  "eval_recall": 0.8328787052191308,
215
+ "eval_runtime": 5.08,
216
+ "eval_samples_per_second": 78.543,
217
+ "eval_steps_per_second": 9.842,
218
  "step": 1342
219
  },
220
  {
 
231
  "eval_loss": 0.35203850269317627,
232
  "eval_precision": 0.822024085224641,
233
  "eval_recall": 0.837152209492635,
234
+ "eval_runtime": 5.0962,
235
+ "eval_samples_per_second": 78.294,
236
+ "eval_steps_per_second": 9.811,
237
  "step": 1464
238
  },
239
  {
 
250
  "eval_loss": 0.33577361702919006,
251
  "eval_precision": 0.8201621387462095,
252
  "eval_recall": 0.8136024731769412,
253
+ "eval_runtime": 5.0497,
254
+ "eval_samples_per_second": 79.014,
255
+ "eval_steps_per_second": 9.902,
256
  "step": 1586
257
  },
258
  {
 
269
  "eval_loss": 0.3354940712451935,
270
  "eval_precision": 0.8352012604792199,
271
  "eval_recall": 0.8417439534460811,
272
+ "eval_runtime": 5.0822,
273
+ "eval_samples_per_second": 78.509,
274
+ "eval_steps_per_second": 9.838,
275
  "step": 1708
276
  },
277
  {
 
288
  "eval_loss": 0.3406221270561218,
289
  "eval_precision": 0.8345705196182396,
290
  "eval_recall": 0.8442444080741953,
291
+ "eval_runtime": 5.0733,
292
+ "eval_samples_per_second": 78.647,
293
+ "eval_steps_per_second": 9.855,
294
  "step": 1830
295
  },
296
  {
 
307
  "eval_loss": 0.337022989988327,
308
  "eval_precision": 0.8308913308913308,
309
  "eval_recall": 0.8449718130569195,
310
+ "eval_runtime": 5.074,
311
+ "eval_samples_per_second": 78.636,
312
+ "eval_steps_per_second": 9.854,
313
  "step": 1952
314
  },
315
  {
 
326
  "eval_loss": 0.3271777033805847,
327
  "eval_precision": 0.8411320530352577,
328
  "eval_recall": 0.8477905073649754,
329
+ "eval_runtime": 5.0533,
330
+ "eval_samples_per_second": 78.958,
331
+ "eval_steps_per_second": 9.894,
332
  "step": 2074
333
  },
334
  {
 
345
  "eval_loss": 0.3318663537502289,
346
  "eval_precision": 0.8313636363636363,
347
  "eval_recall": 0.8424713584288053,
348
+ "eval_runtime": 5.0843,
349
+ "eval_samples_per_second": 78.477,
350
+ "eval_steps_per_second": 9.834,
351
  "step": 2196
352
  },
353
  {
 
364
  "eval_loss": 0.3293265402317047,
365
  "eval_precision": 0.8411320530352577,
366
  "eval_recall": 0.8477905073649754,
367
+ "eval_runtime": 5.0621,
368
+ "eval_samples_per_second": 78.82,
369
+ "eval_steps_per_second": 9.877,
370
  "step": 2318
371
  },
372
  {
 
383
  "eval_loss": 0.33090195059776306,
384
  "eval_precision": 0.8378262413446174,
385
  "eval_recall": 0.8460174577195854,
386
+ "eval_runtime": 5.0495,
387
+ "eval_samples_per_second": 79.018,
388
+ "eval_steps_per_second": 9.902,
389
  "step": 2440
390
  },
391
  {
 
393
  "step": 2440,
394
  "total_flos": 7609911792720000.0,
395
  "train_loss": 0.3206107397548488,
396
+ "train_runtime": 1953.692,
397
+ "train_samples_per_second": 37.242,
398
+ "train_steps_per_second": 1.249
399
  }
400
  ],
401
  "logging_steps": 500,