apwic commited on
Commit
ca7a4f0
1 Parent(s): 621abe2

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -6,16 +6,16 @@
6
  "eval_loss": 0.29368409514427185,
7
  "eval_precision": 0.8573798178418481,
8
  "eval_recall": 0.8591562102200401,
9
- "eval_runtime": 4.9708,
10
  "eval_samples": 399,
11
- "eval_samples_per_second": 80.268,
12
- "eval_steps_per_second": 10.059,
13
  "f1": 0.8877529196862761,
14
  "precision": 0.8852319695351321,
15
  "recall": 0.8904101207677175,
16
  "train_loss": 0.23575165701694176,
17
- "train_runtime": 1929.0983,
18
  "train_samples": 3638,
19
- "train_samples_per_second": 37.717,
20
- "train_steps_per_second": 1.265
21
  }
 
6
  "eval_loss": 0.29368409514427185,
7
  "eval_precision": 0.8573798178418481,
8
  "eval_recall": 0.8591562102200401,
9
+ "eval_runtime": 5.0799,
10
  "eval_samples": 399,
11
+ "eval_samples_per_second": 78.545,
12
+ "eval_steps_per_second": 9.843,
13
  "f1": 0.8877529196862761,
14
  "precision": 0.8852319695351321,
15
  "recall": 0.8904101207677175,
16
  "train_loss": 0.23575165701694176,
17
+ "train_runtime": 1927.8211,
18
  "train_samples": 3638,
19
+ "train_samples_per_second": 37.742,
20
+ "train_steps_per_second": 1.266
21
  }
eval_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_loss": 0.29368409514427185,
6
  "eval_precision": 0.8573798178418481,
7
  "eval_recall": 0.8591562102200401,
8
- "eval_runtime": 4.9708,
9
  "eval_samples": 399,
10
- "eval_samples_per_second": 80.268,
11
- "eval_steps_per_second": 10.059
12
  }
 
5
  "eval_loss": 0.29368409514427185,
6
  "eval_precision": 0.8573798178418481,
7
  "eval_recall": 0.8591562102200401,
8
+ "eval_runtime": 5.0799,
9
  "eval_samples": 399,
10
+ "eval_samples_per_second": 78.545,
11
+ "eval_steps_per_second": 9.843
12
  }
predict_results.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.9060336300692384,
3
+ "f1": 0.8877529196862761,
4
+ "precision": 0.8852319695351321,
5
+ "recall": 0.8904101207677175
6
+ }
runs/May25_18-37-55_indolem-petl-vm/events.out.tfevents.1716664221.indolem-petl-vm.2395462.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c19e561aa5e7fbfe3d6f4386016c218251422dd3853777430173b60d765a9c8d
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.23575165701694176,
4
- "train_runtime": 1929.0983,
5
  "train_samples": 3638,
6
- "train_samples_per_second": 37.717,
7
- "train_steps_per_second": 1.265
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.23575165701694176,
4
+ "train_runtime": 1927.8211,
5
  "train_samples": 3638,
6
+ "train_samples_per_second": 37.742,
7
+ "train_steps_per_second": 1.266
8
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_loss": 0.499358206987381,
23
  "eval_precision": 0.6878057302585605,
24
  "eval_recall": 0.6466175668303328,
25
- "eval_runtime": 5.1448,
26
- "eval_samples_per_second": 77.555,
27
- "eval_steps_per_second": 9.719,
28
  "step": 122
29
  },
30
  {
@@ -41,9 +41,9 @@
41
  "eval_loss": 0.4013344645500183,
42
  "eval_precision": 0.7567868206139117,
43
  "eval_recall": 0.7763684306237497,
44
- "eval_runtime": 5.1016,
45
- "eval_samples_per_second": 78.21,
46
- "eval_steps_per_second": 9.801,
47
  "step": 244
48
  },
49
  {
@@ -60,9 +60,9 @@
60
  "eval_loss": 0.36033105850219727,
61
  "eval_precision": 0.8252399774138905,
62
  "eval_recall": 0.7444080741953083,
63
- "eval_runtime": 5.0897,
64
- "eval_samples_per_second": 78.393,
65
- "eval_steps_per_second": 9.824,
66
  "step": 366
67
  },
68
  {
@@ -79,9 +79,9 @@
79
  "eval_loss": 0.31337350606918335,
80
  "eval_precision": 0.8356565656565657,
81
  "eval_recall": 0.8021458446990362,
82
- "eval_runtime": 5.0627,
83
- "eval_samples_per_second": 78.811,
84
- "eval_steps_per_second": 9.876,
85
  "step": 488
86
  },
87
  {
@@ -98,9 +98,9 @@
98
  "eval_loss": 0.30869799852371216,
99
  "eval_precision": 0.8463358876939919,
100
  "eval_recall": 0.8260138206946717,
101
- "eval_runtime": 5.0959,
102
- "eval_samples_per_second": 78.299,
103
- "eval_steps_per_second": 9.812,
104
  "step": 610
105
  },
106
  {
@@ -117,9 +117,9 @@
117
  "eval_loss": 0.30366042256355286,
118
  "eval_precision": 0.8442805058676086,
119
  "eval_recall": 0.8663393344244408,
120
- "eval_runtime": 5.0606,
121
- "eval_samples_per_second": 78.844,
122
- "eval_steps_per_second": 9.88,
123
  "step": 732
124
  },
125
  {
@@ -136,9 +136,9 @@
136
  "eval_loss": 0.2868788540363312,
137
  "eval_precision": 0.8513631702756499,
138
  "eval_recall": 0.8531096563011457,
139
- "eval_runtime": 5.0634,
140
- "eval_samples_per_second": 78.8,
141
- "eval_steps_per_second": 9.875,
142
  "step": 854
143
  },
144
  {
@@ -155,9 +155,9 @@
155
  "eval_loss": 0.3086492121219635,
156
  "eval_precision": 0.8487520627062706,
157
  "eval_recall": 0.8074649936352064,
158
- "eval_runtime": 5.0752,
159
- "eval_samples_per_second": 78.618,
160
- "eval_steps_per_second": 9.852,
161
  "step": 976
162
  },
163
  {
@@ -174,9 +174,9 @@
174
  "eval_loss": 0.29160723090171814,
175
  "eval_precision": 0.8520237470480189,
176
  "eval_recall": 0.8252864157119476,
177
- "eval_runtime": 5.0705,
178
- "eval_samples_per_second": 78.691,
179
- "eval_steps_per_second": 9.861,
180
  "step": 1098
181
  },
182
  {
@@ -193,9 +193,9 @@
193
  "eval_loss": 0.3077145218849182,
194
  "eval_precision": 0.8579231241892538,
195
  "eval_recall": 0.8177850518276051,
196
- "eval_runtime": 5.0979,
197
- "eval_samples_per_second": 78.267,
198
- "eval_steps_per_second": 9.808,
199
  "step": 1220
200
  },
201
  {
@@ -212,9 +212,9 @@
212
  "eval_loss": 0.29099568724632263,
213
  "eval_precision": 0.8385304659498208,
214
  "eval_recall": 0.8435170030914712,
215
- "eval_runtime": 5.064,
216
- "eval_samples_per_second": 78.791,
217
- "eval_steps_per_second": 9.874,
218
  "step": 1342
219
  },
220
  {
@@ -231,9 +231,9 @@
231
  "eval_loss": 0.28647324442863464,
232
  "eval_precision": 0.8529936381473334,
233
  "eval_recall": 0.8598836152027641,
234
- "eval_runtime": 5.0555,
235
- "eval_samples_per_second": 78.924,
236
- "eval_steps_per_second": 9.89,
237
  "step": 1464
238
  },
239
  {
@@ -250,9 +250,9 @@
250
  "eval_loss": 0.3067673444747925,
251
  "eval_precision": 0.8520237470480189,
252
  "eval_recall": 0.8252864157119476,
253
- "eval_runtime": 5.0624,
254
- "eval_samples_per_second": 78.817,
255
- "eval_steps_per_second": 9.877,
256
  "step": 1586
257
  },
258
  {
@@ -269,9 +269,9 @@
269
  "eval_loss": 0.29624542593955994,
270
  "eval_precision": 0.8587217615098657,
271
  "eval_recall": 0.8802054919076197,
272
- "eval_runtime": 5.1164,
273
- "eval_samples_per_second": 77.985,
274
- "eval_steps_per_second": 9.773,
275
  "step": 1708
276
  },
277
  {
@@ -288,9 +288,9 @@
288
  "eval_loss": 0.2889001667499542,
289
  "eval_precision": 0.8645363713902765,
290
  "eval_recall": 0.8627023095108202,
291
- "eval_runtime": 5.0785,
292
- "eval_samples_per_second": 78.566,
293
- "eval_steps_per_second": 9.845,
294
  "step": 1830
295
  },
296
  {
@@ -307,9 +307,9 @@
307
  "eval_loss": 0.2941306233406067,
308
  "eval_precision": 0.8540903540903542,
309
  "eval_recall": 0.8691580287324968,
310
- "eval_runtime": 5.0969,
311
- "eval_samples_per_second": 78.283,
312
- "eval_steps_per_second": 9.81,
313
  "step": 1952
314
  },
315
  {
@@ -326,9 +326,9 @@
326
  "eval_loss": 0.29707595705986023,
327
  "eval_precision": 0.8633733523114054,
328
  "eval_recall": 0.8559283506092017,
329
- "eval_runtime": 5.0647,
330
- "eval_samples_per_second": 78.78,
331
- "eval_steps_per_second": 9.872,
332
  "step": 2074
333
  },
334
  {
@@ -345,9 +345,9 @@
345
  "eval_loss": 0.29374733567237854,
346
  "eval_precision": 0.8620943049601959,
347
  "eval_recall": 0.8584288052373159,
348
- "eval_runtime": 5.0798,
349
- "eval_samples_per_second": 78.546,
350
- "eval_steps_per_second": 9.843,
351
  "step": 2196
352
  },
353
  {
@@ -364,9 +364,9 @@
364
  "eval_loss": 0.2946490943431854,
365
  "eval_precision": 0.8596491228070176,
366
  "eval_recall": 0.8541553009638116,
367
- "eval_runtime": 5.061,
368
- "eval_samples_per_second": 78.837,
369
- "eval_steps_per_second": 9.879,
370
  "step": 2318
371
  },
372
  {
@@ -383,9 +383,9 @@
383
  "eval_loss": 0.29368409514427185,
384
  "eval_precision": 0.8573798178418481,
385
  "eval_recall": 0.8591562102200401,
386
- "eval_runtime": 5.0593,
387
- "eval_samples_per_second": 78.864,
388
- "eval_steps_per_second": 9.883,
389
  "step": 2440
390
  },
391
  {
@@ -393,9 +393,9 @@
393
  "step": 2440,
394
  "total_flos": 8444128359504000.0,
395
  "train_loss": 0.23575165701694176,
396
- "train_runtime": 1929.0983,
397
- "train_samples_per_second": 37.717,
398
- "train_steps_per_second": 1.265
399
  }
400
  ],
401
  "logging_steps": 500,
 
22
  "eval_loss": 0.499358206987381,
23
  "eval_precision": 0.6878057302585605,
24
  "eval_recall": 0.6466175668303328,
25
+ "eval_runtime": 5.0995,
26
+ "eval_samples_per_second": 78.243,
27
+ "eval_steps_per_second": 9.805,
28
  "step": 122
29
  },
30
  {
 
41
  "eval_loss": 0.4013344645500183,
42
  "eval_precision": 0.7567868206139117,
43
  "eval_recall": 0.7763684306237497,
44
+ "eval_runtime": 5.1487,
45
+ "eval_samples_per_second": 77.495,
46
+ "eval_steps_per_second": 9.711,
47
  "step": 244
48
  },
49
  {
 
60
  "eval_loss": 0.36033105850219727,
61
  "eval_precision": 0.8252399774138905,
62
  "eval_recall": 0.7444080741953083,
63
+ "eval_runtime": 5.0787,
64
+ "eval_samples_per_second": 78.564,
65
+ "eval_steps_per_second": 9.845,
66
  "step": 366
67
  },
68
  {
 
79
  "eval_loss": 0.31337350606918335,
80
  "eval_precision": 0.8356565656565657,
81
  "eval_recall": 0.8021458446990362,
82
+ "eval_runtime": 5.0532,
83
+ "eval_samples_per_second": 78.96,
84
+ "eval_steps_per_second": 9.895,
85
  "step": 488
86
  },
87
  {
 
98
  "eval_loss": 0.30869799852371216,
99
  "eval_precision": 0.8463358876939919,
100
  "eval_recall": 0.8260138206946717,
101
+ "eval_runtime": 5.1714,
102
+ "eval_samples_per_second": 77.155,
103
+ "eval_steps_per_second": 9.669,
104
  "step": 610
105
  },
106
  {
 
117
  "eval_loss": 0.30366042256355286,
118
  "eval_precision": 0.8442805058676086,
119
  "eval_recall": 0.8663393344244408,
120
+ "eval_runtime": 5.0754,
121
+ "eval_samples_per_second": 78.614,
122
+ "eval_steps_per_second": 9.851,
123
  "step": 732
124
  },
125
  {
 
136
  "eval_loss": 0.2868788540363312,
137
  "eval_precision": 0.8513631702756499,
138
  "eval_recall": 0.8531096563011457,
139
+ "eval_runtime": 5.0844,
140
+ "eval_samples_per_second": 78.476,
141
+ "eval_steps_per_second": 9.834,
142
  "step": 854
143
  },
144
  {
 
155
  "eval_loss": 0.3086492121219635,
156
  "eval_precision": 0.8487520627062706,
157
  "eval_recall": 0.8074649936352064,
158
+ "eval_runtime": 5.076,
159
+ "eval_samples_per_second": 78.605,
160
+ "eval_steps_per_second": 9.85,
161
  "step": 976
162
  },
163
  {
 
174
  "eval_loss": 0.29160723090171814,
175
  "eval_precision": 0.8520237470480189,
176
  "eval_recall": 0.8252864157119476,
177
+ "eval_runtime": 5.0668,
178
+ "eval_samples_per_second": 78.748,
179
+ "eval_steps_per_second": 9.868,
180
  "step": 1098
181
  },
182
  {
 
193
  "eval_loss": 0.3077145218849182,
194
  "eval_precision": 0.8579231241892538,
195
  "eval_recall": 0.8177850518276051,
196
+ "eval_runtime": 5.1374,
197
+ "eval_samples_per_second": 77.665,
198
+ "eval_steps_per_second": 9.733,
199
  "step": 1220
200
  },
201
  {
 
212
  "eval_loss": 0.29099568724632263,
213
  "eval_precision": 0.8385304659498208,
214
  "eval_recall": 0.8435170030914712,
215
+ "eval_runtime": 5.0596,
216
+ "eval_samples_per_second": 78.861,
217
+ "eval_steps_per_second": 9.882,
218
  "step": 1342
219
  },
220
  {
 
231
  "eval_loss": 0.28647324442863464,
232
  "eval_precision": 0.8529936381473334,
233
  "eval_recall": 0.8598836152027641,
234
+ "eval_runtime": 5.0747,
235
+ "eval_samples_per_second": 78.626,
236
+ "eval_steps_per_second": 9.853,
237
  "step": 1464
238
  },
239
  {
 
250
  "eval_loss": 0.3067673444747925,
251
  "eval_precision": 0.8520237470480189,
252
  "eval_recall": 0.8252864157119476,
253
+ "eval_runtime": 5.0713,
254
+ "eval_samples_per_second": 78.679,
255
+ "eval_steps_per_second": 9.859,
256
  "step": 1586
257
  },
258
  {
 
269
  "eval_loss": 0.29624542593955994,
270
  "eval_precision": 0.8587217615098657,
271
  "eval_recall": 0.8802054919076197,
272
+ "eval_runtime": 5.0603,
273
+ "eval_samples_per_second": 78.849,
274
+ "eval_steps_per_second": 9.881,
275
  "step": 1708
276
  },
277
  {
 
288
  "eval_loss": 0.2889001667499542,
289
  "eval_precision": 0.8645363713902765,
290
  "eval_recall": 0.8627023095108202,
291
+ "eval_runtime": 5.1374,
292
+ "eval_samples_per_second": 77.666,
293
+ "eval_steps_per_second": 9.733,
294
  "step": 1830
295
  },
296
  {
 
307
  "eval_loss": 0.2941306233406067,
308
  "eval_precision": 0.8540903540903542,
309
  "eval_recall": 0.8691580287324968,
310
+ "eval_runtime": 5.0692,
311
+ "eval_samples_per_second": 78.711,
312
+ "eval_steps_per_second": 9.863,
313
  "step": 1952
314
  },
315
  {
 
326
  "eval_loss": 0.29707595705986023,
327
  "eval_precision": 0.8633733523114054,
328
  "eval_recall": 0.8559283506092017,
329
+ "eval_runtime": 5.0692,
330
+ "eval_samples_per_second": 78.711,
331
+ "eval_steps_per_second": 9.864,
332
  "step": 2074
333
  },
334
  {
 
345
  "eval_loss": 0.29374733567237854,
346
  "eval_precision": 0.8620943049601959,
347
  "eval_recall": 0.8584288052373159,
348
+ "eval_runtime": 5.0687,
349
+ "eval_samples_per_second": 78.718,
350
+ "eval_steps_per_second": 9.864,
351
  "step": 2196
352
  },
353
  {
 
364
  "eval_loss": 0.2946490943431854,
365
  "eval_precision": 0.8596491228070176,
366
  "eval_recall": 0.8541553009638116,
367
+ "eval_runtime": 5.0871,
368
+ "eval_samples_per_second": 78.434,
369
+ "eval_steps_per_second": 9.829,
370
  "step": 2318
371
  },
372
  {
 
383
  "eval_loss": 0.29368409514427185,
384
  "eval_precision": 0.8573798178418481,
385
  "eval_recall": 0.8591562102200401,
386
+ "eval_runtime": 5.1066,
387
+ "eval_samples_per_second": 78.134,
388
+ "eval_steps_per_second": 9.791,
389
  "step": 2440
390
  },
391
  {
 
393
  "step": 2440,
394
  "total_flos": 8444128359504000.0,
395
  "train_loss": 0.23575165701694176,
396
+ "train_runtime": 1927.8211,
397
+ "train_samples_per_second": 37.742,
398
+ "train_steps_per_second": 1.266
399
  }
400
  ],
401
  "logging_steps": 500,