apwic committed on
Commit
d907130
1 Parent(s): 8d6ee5e

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -6,16 +6,16 @@
6
  "eval_loss": 0.2913039028644562,
7
  "eval_precision": 0.8851154755410074,
8
  "eval_recall": 0.8851154755410074,
9
- "eval_runtime": 5.0888,
10
  "eval_samples": 399,
11
- "eval_samples_per_second": 78.408,
12
- "eval_steps_per_second": 9.826,
13
  "f1": 0.875810040328188,
14
  "precision": 0.8705850368732237,
15
  "recall": 0.8817196456978266,
16
  "train_loss": 0.22896970373685244,
17
- "train_runtime": 1959.4286,
18
  "train_samples": 3638,
19
- "train_samples_per_second": 37.133,
20
- "train_steps_per_second": 1.245
21
  }
 
6
  "eval_loss": 0.2913039028644562,
7
  "eval_precision": 0.8851154755410074,
8
  "eval_recall": 0.8851154755410074,
9
+ "eval_runtime": 5.1012,
10
  "eval_samples": 399,
11
+ "eval_samples_per_second": 78.217,
12
+ "eval_steps_per_second": 9.802,
13
  "f1": 0.875810040328188,
14
  "precision": 0.8705850368732237,
15
  "recall": 0.8817196456978266,
16
  "train_loss": 0.22896970373685244,
17
+ "train_runtime": 1968.7629,
18
  "train_samples": 3638,
19
+ "train_samples_per_second": 36.957,
20
+ "train_steps_per_second": 1.239
21
  }
eval_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_loss": 0.2913039028644562,
6
  "eval_precision": 0.8851154755410074,
7
  "eval_recall": 0.8851154755410074,
8
- "eval_runtime": 5.0888,
9
  "eval_samples": 399,
10
- "eval_samples_per_second": 78.408,
11
- "eval_steps_per_second": 9.826
12
  }
 
5
  "eval_loss": 0.2913039028644562,
6
  "eval_precision": 0.8851154755410074,
7
  "eval_recall": 0.8851154755410074,
8
+ "eval_runtime": 5.1012,
9
  "eval_samples": 399,
10
+ "eval_samples_per_second": 78.217,
11
+ "eval_steps_per_second": 9.802
12
  }
predict_results.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.8951533135509396,
3
+ "f1": 0.875810040328188,
4
+ "precision": 0.8705850368732237,
5
+ "recall": 0.8817196456978266
6
+ }
runs/May25_17-31-29_indolem-petl-vm/events.out.tfevents.1716660276.indolem-petl-vm.2348815.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904d57b8cf3adb6ab50f8aeda23fe598c4d462441d71961ac4467ba90bad15ca
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.22896970373685244,
4
- "train_runtime": 1959.4286,
5
  "train_samples": 3638,
6
- "train_samples_per_second": 37.133,
7
- "train_steps_per_second": 1.245
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.22896970373685244,
4
+ "train_runtime": 1968.7629,
5
  "train_samples": 3638,
6
+ "train_samples_per_second": 36.957,
7
+ "train_steps_per_second": 1.239
8
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_loss": 0.4752861261367798,
23
  "eval_precision": 0.6464762782128051,
24
  "eval_recall": 0.5963811602109474,
25
- "eval_runtime": 5.343,
26
- "eval_samples_per_second": 74.677,
27
- "eval_steps_per_second": 9.358,
28
  "step": 122
29
  },
30
  {
@@ -41,9 +41,9 @@
41
  "eval_loss": 0.4070126414299011,
42
  "eval_precision": 0.7589055735189347,
43
  "eval_recall": 0.7863702491362066,
44
- "eval_runtime": 5.1525,
45
- "eval_samples_per_second": 77.438,
46
- "eval_steps_per_second": 9.704,
47
  "step": 244
48
  },
49
  {
@@ -60,9 +60,9 @@
60
  "eval_loss": 0.3412257730960846,
61
  "eval_precision": 0.8231252179979072,
62
  "eval_recall": 0.7807783233315149,
63
- "eval_runtime": 5.171,
64
- "eval_samples_per_second": 77.16,
65
- "eval_steps_per_second": 9.669,
66
  "step": 366
67
  },
68
  {
@@ -79,9 +79,9 @@
79
  "eval_loss": 0.3252820372581482,
80
  "eval_precision": 0.8263351692555232,
81
  "eval_recall": 0.8196490270958356,
82
- "eval_runtime": 5.1862,
83
- "eval_samples_per_second": 76.935,
84
- "eval_steps_per_second": 9.641,
85
  "step": 488
86
  },
87
  {
@@ -98,9 +98,9 @@
98
  "eval_loss": 0.2941116690635681,
99
  "eval_precision": 0.8609538327526132,
100
  "eval_recall": 0.8516548463356974,
101
- "eval_runtime": 5.1746,
102
- "eval_samples_per_second": 77.108,
103
- "eval_steps_per_second": 9.663,
104
  "step": 610
105
  },
106
  {
@@ -117,9 +117,9 @@
117
  "eval_loss": 0.2965351343154907,
118
  "eval_precision": 0.8473119816985988,
119
  "eval_recall": 0.8681123840698308,
120
- "eval_runtime": 5.1845,
121
- "eval_samples_per_second": 76.96,
122
- "eval_steps_per_second": 9.644,
123
  "step": 732
124
  },
125
  {
@@ -136,9 +136,9 @@
136
  "eval_loss": 0.286903977394104,
137
  "eval_precision": 0.8446597760551249,
138
  "eval_recall": 0.8638388797963266,
139
- "eval_runtime": 5.1647,
140
- "eval_samples_per_second": 77.254,
141
- "eval_steps_per_second": 9.681,
142
  "step": 854
143
  },
144
  {
@@ -155,9 +155,9 @@
155
  "eval_loss": 0.2795129120349884,
156
  "eval_precision": 0.8961111111111111,
157
  "eval_recall": 0.8565648299690853,
158
- "eval_runtime": 5.1699,
159
- "eval_samples_per_second": 77.177,
160
- "eval_steps_per_second": 9.671,
161
  "step": 976
162
  },
163
  {
@@ -174,9 +174,9 @@
174
  "eval_loss": 0.27050527930259705,
175
  "eval_precision": 0.8673433153814287,
176
  "eval_recall": 0.8762502273140571,
177
- "eval_runtime": 5.1829,
178
- "eval_samples_per_second": 76.984,
179
- "eval_steps_per_second": 9.647,
180
  "step": 1098
181
  },
182
  {
@@ -193,9 +193,9 @@
193
  "eval_loss": 0.275096595287323,
194
  "eval_precision": 0.89198606271777,
195
  "eval_recall": 0.8818876159301692,
196
- "eval_runtime": 5.1456,
197
- "eval_samples_per_second": 77.542,
198
- "eval_steps_per_second": 9.717,
199
  "step": 1220
200
  },
201
  {
@@ -212,9 +212,9 @@
212
  "eval_loss": 0.27452006936073303,
213
  "eval_precision": 0.8826476009275225,
214
  "eval_recall": 0.8901163847972358,
215
- "eval_runtime": 5.1616,
216
- "eval_samples_per_second": 77.301,
217
- "eval_steps_per_second": 9.687,
218
  "step": 1342
219
  },
220
  {
@@ -231,9 +231,9 @@
231
  "eval_loss": 0.279909610748291,
232
  "eval_precision": 0.8956662848415425,
233
  "eval_recall": 0.8768867066739408,
234
- "eval_runtime": 5.0933,
235
- "eval_samples_per_second": 78.338,
236
- "eval_steps_per_second": 9.817,
237
  "step": 1464
238
  },
239
  {
@@ -250,9 +250,9 @@
250
  "eval_loss": 0.27386558055877686,
251
  "eval_precision": 0.8959740990990992,
252
  "eval_recall": 0.8836606655755592,
253
- "eval_runtime": 5.1138,
254
- "eval_samples_per_second": 78.024,
255
- "eval_steps_per_second": 9.778,
256
  "step": 1586
257
  },
258
  {
@@ -269,9 +269,9 @@
269
  "eval_loss": 0.28680744767189026,
270
  "eval_precision": 0.8862007168458781,
271
  "eval_recall": 0.8918894344426259,
272
- "eval_runtime": 5.0739,
273
- "eval_samples_per_second": 78.638,
274
- "eval_steps_per_second": 9.854,
275
  "step": 1708
276
  },
277
  {
@@ -288,9 +288,9 @@
288
  "eval_loss": 0.2929786145687103,
289
  "eval_precision": 0.8827677592299257,
290
  "eval_recall": 0.8808419712675032,
291
- "eval_runtime": 5.1442,
292
- "eval_samples_per_second": 77.564,
293
- "eval_steps_per_second": 9.72,
294
  "step": 1830
295
  },
296
  {
@@ -307,9 +307,9 @@
307
  "eval_loss": 0.3041006028652191,
308
  "eval_precision": 0.8682260305697083,
309
  "eval_recall": 0.8855246408437898,
310
- "eval_runtime": 5.0804,
311
- "eval_samples_per_second": 78.537,
312
- "eval_steps_per_second": 9.842,
313
  "step": 1952
314
  },
315
  {
@@ -326,9 +326,9 @@
326
  "eval_loss": 0.28764259815216064,
327
  "eval_precision": 0.8814464081066409,
328
  "eval_recall": 0.8833424258956174,
329
- "eval_runtime": 5.2288,
330
- "eval_samples_per_second": 76.309,
331
- "eval_steps_per_second": 9.562,
332
  "step": 2074
333
  },
334
  {
@@ -345,9 +345,9 @@
345
  "eval_loss": 0.28996890783309937,
346
  "eval_precision": 0.8865278628291489,
347
  "eval_recall": 0.8826150209128933,
348
- "eval_runtime": 5.1376,
349
- "eval_samples_per_second": 77.663,
350
- "eval_steps_per_second": 9.732,
351
  "step": 2196
352
  },
353
  {
@@ -364,9 +364,9 @@
364
  "eval_loss": 0.2917177975177765,
365
  "eval_precision": 0.8851154755410074,
366
  "eval_recall": 0.8851154755410074,
367
- "eval_runtime": 5.1533,
368
- "eval_samples_per_second": 77.427,
369
- "eval_steps_per_second": 9.703,
370
  "step": 2318
371
  },
372
  {
@@ -383,9 +383,9 @@
383
  "eval_loss": 0.2913039028644562,
384
  "eval_precision": 0.8851154755410074,
385
  "eval_recall": 0.8851154755410074,
386
- "eval_runtime": 5.2712,
387
- "eval_samples_per_second": 75.694,
388
- "eval_steps_per_second": 9.486,
389
  "step": 2440
390
  },
391
  {
@@ -393,9 +393,9 @@
393
  "step": 2440,
394
  "total_flos": 8444128359504000.0,
395
  "train_loss": 0.22896970373685244,
396
- "train_runtime": 1959.4286,
397
- "train_samples_per_second": 37.133,
398
- "train_steps_per_second": 1.245
399
  }
400
  ],
401
  "logging_steps": 500,
 
22
  "eval_loss": 0.4752861261367798,
23
  "eval_precision": 0.6464762782128051,
24
  "eval_recall": 0.5963811602109474,
25
+ "eval_runtime": 5.2249,
26
+ "eval_samples_per_second": 76.365,
27
+ "eval_steps_per_second": 9.57,
28
  "step": 122
29
  },
30
  {
 
41
  "eval_loss": 0.4070126414299011,
42
  "eval_precision": 0.7589055735189347,
43
  "eval_recall": 0.7863702491362066,
44
+ "eval_runtime": 5.1546,
45
+ "eval_samples_per_second": 77.407,
46
+ "eval_steps_per_second": 9.7,
47
  "step": 244
48
  },
49
  {
 
60
  "eval_loss": 0.3412257730960846,
61
  "eval_precision": 0.8231252179979072,
62
  "eval_recall": 0.7807783233315149,
63
+ "eval_runtime": 5.1898,
64
+ "eval_samples_per_second": 76.882,
65
+ "eval_steps_per_second": 9.634,
66
  "step": 366
67
  },
68
  {
 
79
  "eval_loss": 0.3252820372581482,
80
  "eval_precision": 0.8263351692555232,
81
  "eval_recall": 0.8196490270958356,
82
+ "eval_runtime": 5.1759,
83
+ "eval_samples_per_second": 77.088,
84
+ "eval_steps_per_second": 9.66,
85
  "step": 488
86
  },
87
  {
 
98
  "eval_loss": 0.2941116690635681,
99
  "eval_precision": 0.8609538327526132,
100
  "eval_recall": 0.8516548463356974,
101
+ "eval_runtime": 5.1453,
102
+ "eval_samples_per_second": 77.546,
103
+ "eval_steps_per_second": 9.718,
104
  "step": 610
105
  },
106
  {
 
117
  "eval_loss": 0.2965351343154907,
118
  "eval_precision": 0.8473119816985988,
119
  "eval_recall": 0.8681123840698308,
120
+ "eval_runtime": 5.1607,
121
+ "eval_samples_per_second": 77.315,
122
+ "eval_steps_per_second": 9.689,
123
  "step": 732
124
  },
125
  {
 
136
  "eval_loss": 0.286903977394104,
137
  "eval_precision": 0.8446597760551249,
138
  "eval_recall": 0.8638388797963266,
139
+ "eval_runtime": 5.4309,
140
+ "eval_samples_per_second": 73.468,
141
+ "eval_steps_per_second": 9.207,
142
  "step": 854
143
  },
144
  {
 
155
  "eval_loss": 0.2795129120349884,
156
  "eval_precision": 0.8961111111111111,
157
  "eval_recall": 0.8565648299690853,
158
+ "eval_runtime": 5.1715,
159
+ "eval_samples_per_second": 77.153,
160
+ "eval_steps_per_second": 9.668,
161
  "step": 976
162
  },
163
  {
 
174
  "eval_loss": 0.27050527930259705,
175
  "eval_precision": 0.8673433153814287,
176
  "eval_recall": 0.8762502273140571,
177
+ "eval_runtime": 5.1606,
178
+ "eval_samples_per_second": 77.317,
179
+ "eval_steps_per_second": 9.689,
180
  "step": 1098
181
  },
182
  {
 
193
  "eval_loss": 0.275096595287323,
194
  "eval_precision": 0.89198606271777,
195
  "eval_recall": 0.8818876159301692,
196
+ "eval_runtime": 5.1671,
197
+ "eval_samples_per_second": 77.22,
198
+ "eval_steps_per_second": 9.677,
199
  "step": 1220
200
  },
201
  {
 
212
  "eval_loss": 0.27452006936073303,
213
  "eval_precision": 0.8826476009275225,
214
  "eval_recall": 0.8901163847972358,
215
+ "eval_runtime": 5.1559,
216
+ "eval_samples_per_second": 77.387,
217
+ "eval_steps_per_second": 9.698,
218
  "step": 1342
219
  },
220
  {
 
231
  "eval_loss": 0.279909610748291,
232
  "eval_precision": 0.8956662848415425,
233
  "eval_recall": 0.8768867066739408,
234
+ "eval_runtime": 5.1353,
235
+ "eval_samples_per_second": 77.698,
236
+ "eval_steps_per_second": 9.737,
237
  "step": 1464
238
  },
239
  {
 
250
  "eval_loss": 0.27386558055877686,
251
  "eval_precision": 0.8959740990990992,
252
  "eval_recall": 0.8836606655755592,
253
+ "eval_runtime": 5.1775,
254
+ "eval_samples_per_second": 77.065,
255
+ "eval_steps_per_second": 9.657,
256
  "step": 1586
257
  },
258
  {
 
269
  "eval_loss": 0.28680744767189026,
270
  "eval_precision": 0.8862007168458781,
271
  "eval_recall": 0.8918894344426259,
272
+ "eval_runtime": 5.1734,
273
+ "eval_samples_per_second": 77.126,
274
+ "eval_steps_per_second": 9.665,
275
  "step": 1708
276
  },
277
  {
 
288
  "eval_loss": 0.2929786145687103,
289
  "eval_precision": 0.8827677592299257,
290
  "eval_recall": 0.8808419712675032,
291
+ "eval_runtime": 5.1562,
292
+ "eval_samples_per_second": 77.383,
293
+ "eval_steps_per_second": 9.697,
294
  "step": 1830
295
  },
296
  {
 
307
  "eval_loss": 0.3041006028652191,
308
  "eval_precision": 0.8682260305697083,
309
  "eval_recall": 0.8855246408437898,
310
+ "eval_runtime": 5.1466,
311
+ "eval_samples_per_second": 77.527,
312
+ "eval_steps_per_second": 9.715,
313
  "step": 1952
314
  },
315
  {
 
326
  "eval_loss": 0.28764259815216064,
327
  "eval_precision": 0.8814464081066409,
328
  "eval_recall": 0.8833424258956174,
329
+ "eval_runtime": 5.1398,
330
+ "eval_samples_per_second": 77.63,
331
+ "eval_steps_per_second": 9.728,
332
  "step": 2074
333
  },
334
  {
 
345
  "eval_loss": 0.28996890783309937,
346
  "eval_precision": 0.8865278628291489,
347
  "eval_recall": 0.8826150209128933,
348
+ "eval_runtime": 5.3979,
349
+ "eval_samples_per_second": 73.917,
350
+ "eval_steps_per_second": 9.263,
351
  "step": 2196
352
  },
353
  {
 
364
  "eval_loss": 0.2917177975177765,
365
  "eval_precision": 0.8851154755410074,
366
  "eval_recall": 0.8851154755410074,
367
+ "eval_runtime": 5.1418,
368
+ "eval_samples_per_second": 77.6,
369
+ "eval_steps_per_second": 9.724,
370
  "step": 2318
371
  },
372
  {
 
383
  "eval_loss": 0.2913039028644562,
384
  "eval_precision": 0.8851154755410074,
385
  "eval_recall": 0.8851154755410074,
386
+ "eval_runtime": 5.1424,
387
+ "eval_samples_per_second": 77.591,
388
+ "eval_steps_per_second": 9.723,
389
  "step": 2440
390
  },
391
  {
 
393
  "step": 2440,
394
  "total_flos": 8444128359504000.0,
395
  "train_loss": 0.22896970373685244,
396
+ "train_runtime": 1968.7629,
397
+ "train_samples_per_second": 36.957,
398
+ "train_steps_per_second": 1.239
399
  }
400
  ],
401
  "logging_steps": 500,