apwic committed on
Commit
13e64ef
1 Parent(s): 67b1d90

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -6,16 +6,16 @@
6
  "eval_loss": 0.33090195059776306,
7
  "eval_precision": 0.8378262413446174,
8
  "eval_recall": 0.8460174577195854,
9
- "eval_runtime": 4.9516,
10
  "eval_samples": 399,
11
- "eval_samples_per_second": 80.58,
12
- "eval_steps_per_second": 10.098,
13
  "f1": 0.8418232002914281,
14
  "precision": 0.8393060770407454,
15
  "recall": 0.8445056806950497,
16
  "train_loss": 0.3206107397548488,
17
- "train_runtime": 1956.4863,
18
  "train_samples": 3638,
19
- "train_samples_per_second": 37.189,
20
- "train_steps_per_second": 1.247
21
  }
 
6
  "eval_loss": 0.33090195059776306,
7
  "eval_precision": 0.8378262413446174,
8
  "eval_recall": 0.8460174577195854,
9
+ "eval_runtime": 5.0841,
10
  "eval_samples": 399,
11
+ "eval_samples_per_second": 78.48,
12
+ "eval_steps_per_second": 9.835,
13
  "f1": 0.8418232002914281,
14
  "precision": 0.8393060770407454,
15
  "recall": 0.8445056806950497,
16
  "train_loss": 0.3206107397548488,
17
+ "train_runtime": 1939.2465,
18
  "train_samples": 3638,
19
+ "train_samples_per_second": 37.52,
20
+ "train_steps_per_second": 1.258
21
  }
eval_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_loss": 0.33090195059776306,
6
  "eval_precision": 0.8378262413446174,
7
  "eval_recall": 0.8460174577195854,
8
- "eval_runtime": 4.9516,
9
  "eval_samples": 399,
10
- "eval_samples_per_second": 80.58,
11
- "eval_steps_per_second": 10.098
12
  }
 
5
  "eval_loss": 0.33090195059776306,
6
  "eval_precision": 0.8378262413446174,
7
  "eval_recall": 0.8460174577195854,
8
+ "eval_runtime": 5.0841,
9
  "eval_samples": 399,
10
+ "eval_samples_per_second": 78.48,
11
+ "eval_steps_per_second": 9.835
12
  }
predict_results.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.8674579624134521,
3
+ "f1": 0.8418232002914281,
4
+ "precision": 0.8393060770407454,
5
+ "recall": 0.8445056806950497
6
+ }
runs/May26_12-07-29_indolem-petl-vm/events.out.tfevents.1716727207.indolem-petl-vm.2867885.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb6ab131360d63d3be62742b3ebdd011402a781da734bc87cce465acfbd022b
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.3206107397548488,
4
- "train_runtime": 1956.4863,
5
  "train_samples": 3638,
6
- "train_samples_per_second": 37.189,
7
- "train_steps_per_second": 1.247
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.3206107397548488,
4
+ "train_runtime": 1939.2465,
5
  "train_samples": 3638,
6
+ "train_samples_per_second": 37.52,
7
+ "train_steps_per_second": 1.258
8
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_loss": 0.5075693130493164,
23
  "eval_precision": 0.6564625850340136,
24
  "eval_recall": 0.6463902527732315,
25
- "eval_runtime": 5.1118,
26
- "eval_samples_per_second": 78.054,
27
- "eval_steps_per_second": 9.781,
28
  "step": 122
29
  },
30
  {
@@ -41,9 +41,9 @@
41
  "eval_loss": 0.48389074206352234,
42
  "eval_precision": 0.7106679035250464,
43
  "eval_recall": 0.7409074377159484,
44
- "eval_runtime": 5.1507,
45
- "eval_samples_per_second": 77.466,
46
- "eval_steps_per_second": 9.707,
47
  "step": 244
48
  },
49
  {
@@ -60,9 +60,9 @@
60
  "eval_loss": 0.425637811422348,
61
  "eval_precision": 0.7280813755532857,
62
  "eval_recall": 0.7436352064011639,
63
- "eval_runtime": 5.0576,
64
- "eval_samples_per_second": 78.892,
65
- "eval_steps_per_second": 9.886,
66
  "step": 366
67
  },
68
  {
@@ -79,9 +79,9 @@
79
  "eval_loss": 0.387967973947525,
80
  "eval_precision": 0.7798245614035089,
81
  "eval_recall": 0.7755501000181851,
82
- "eval_runtime": 5.0583,
83
- "eval_samples_per_second": 78.88,
84
- "eval_steps_per_second": 9.885,
85
  "step": 488
86
  },
87
  {
@@ -98,9 +98,9 @@
98
  "eval_loss": 0.4130999743938446,
99
  "eval_precision": 0.765661378526179,
100
  "eval_recall": 0.7974177123113293,
101
- "eval_runtime": 5.0532,
102
- "eval_samples_per_second": 78.96,
103
- "eval_steps_per_second": 9.895,
104
  "step": 610
105
  },
106
  {
@@ -117,9 +117,9 @@
117
  "eval_loss": 0.36453139781951904,
118
  "eval_precision": 0.7965023376930815,
119
  "eval_recall": 0.803691580287325,
120
- "eval_runtime": 5.057,
121
- "eval_samples_per_second": 78.901,
122
- "eval_steps_per_second": 9.887,
123
  "step": 732
124
  },
125
  {
@@ -136,9 +136,9 @@
136
  "eval_loss": 0.3639658987522125,
137
  "eval_precision": 0.798820781588242,
138
  "eval_recall": 0.8179669030732861,
139
- "eval_runtime": 5.0706,
140
- "eval_samples_per_second": 78.689,
141
- "eval_steps_per_second": 9.861,
142
  "step": 854
143
  },
144
  {
@@ -155,9 +155,9 @@
155
  "eval_loss": 0.3551309108734131,
156
  "eval_precision": 0.7996165051429931,
157
  "eval_recall": 0.8054646299327151,
158
- "eval_runtime": 5.0676,
159
- "eval_samples_per_second": 78.736,
160
- "eval_steps_per_second": 9.867,
161
  "step": 976
162
  },
163
  {
@@ -174,9 +174,9 @@
174
  "eval_loss": 0.3508576452732086,
175
  "eval_precision": 0.8169406150583245,
176
  "eval_recall": 0.8261047463175123,
177
- "eval_runtime": 5.049,
178
- "eval_samples_per_second": 79.025,
179
- "eval_steps_per_second": 9.903,
180
  "step": 1098
181
  },
182
  {
@@ -193,9 +193,9 @@
193
  "eval_loss": 0.341298907995224,
194
  "eval_precision": 0.8212799324446589,
195
  "eval_recall": 0.8228768867066739,
196
- "eval_runtime": 5.1507,
197
- "eval_samples_per_second": 77.465,
198
- "eval_steps_per_second": 9.707,
199
  "step": 1220
200
  },
201
  {
@@ -212,9 +212,9 @@
212
  "eval_loss": 0.3493994474411011,
213
  "eval_precision": 0.8192918192918193,
214
  "eval_recall": 0.8328787052191308,
215
- "eval_runtime": 5.0606,
216
- "eval_samples_per_second": 78.845,
217
- "eval_steps_per_second": 9.88,
218
  "step": 1342
219
  },
220
  {
@@ -231,9 +231,9 @@
231
  "eval_loss": 0.35203850269317627,
232
  "eval_precision": 0.822024085224641,
233
  "eval_recall": 0.837152209492635,
234
- "eval_runtime": 5.073,
235
- "eval_samples_per_second": 78.651,
236
- "eval_steps_per_second": 9.856,
237
  "step": 1464
238
  },
239
  {
@@ -250,9 +250,9 @@
250
  "eval_loss": 0.33577361702919006,
251
  "eval_precision": 0.8201621387462095,
252
  "eval_recall": 0.8136024731769412,
253
- "eval_runtime": 5.0477,
254
- "eval_samples_per_second": 79.046,
255
- "eval_steps_per_second": 9.906,
256
  "step": 1586
257
  },
258
  {
@@ -269,9 +269,9 @@
269
  "eval_loss": 0.3354940712451935,
270
  "eval_precision": 0.8352012604792199,
271
  "eval_recall": 0.8417439534460811,
272
- "eval_runtime": 5.0567,
273
- "eval_samples_per_second": 78.905,
274
- "eval_steps_per_second": 9.888,
275
  "step": 1708
276
  },
277
  {
@@ -288,9 +288,9 @@
288
  "eval_loss": 0.3406221270561218,
289
  "eval_precision": 0.8345705196182396,
290
  "eval_recall": 0.8442444080741953,
291
- "eval_runtime": 5.0502,
292
- "eval_samples_per_second": 79.007,
293
- "eval_steps_per_second": 9.901,
294
  "step": 1830
295
  },
296
  {
@@ -307,9 +307,9 @@
307
  "eval_loss": 0.337022989988327,
308
  "eval_precision": 0.8308913308913308,
309
  "eval_recall": 0.8449718130569195,
310
- "eval_runtime": 5.0526,
311
- "eval_samples_per_second": 78.969,
312
- "eval_steps_per_second": 9.896,
313
  "step": 1952
314
  },
315
  {
@@ -326,9 +326,9 @@
326
  "eval_loss": 0.3271777033805847,
327
  "eval_precision": 0.8411320530352577,
328
  "eval_recall": 0.8477905073649754,
329
- "eval_runtime": 5.0707,
330
- "eval_samples_per_second": 78.687,
331
- "eval_steps_per_second": 9.86,
332
  "step": 2074
333
  },
334
  {
@@ -345,9 +345,9 @@
345
  "eval_loss": 0.3318663537502289,
346
  "eval_precision": 0.8313636363636363,
347
  "eval_recall": 0.8424713584288053,
348
- "eval_runtime": 5.1168,
349
- "eval_samples_per_second": 77.978,
350
- "eval_steps_per_second": 9.772,
351
  "step": 2196
352
  },
353
  {
@@ -364,9 +364,9 @@
364
  "eval_loss": 0.3293265402317047,
365
  "eval_precision": 0.8411320530352577,
366
  "eval_recall": 0.8477905073649754,
367
- "eval_runtime": 5.0594,
368
- "eval_samples_per_second": 78.863,
369
- "eval_steps_per_second": 9.883,
370
  "step": 2318
371
  },
372
  {
@@ -383,9 +383,9 @@
383
  "eval_loss": 0.33090195059776306,
384
  "eval_precision": 0.8378262413446174,
385
  "eval_recall": 0.8460174577195854,
386
- "eval_runtime": 5.0536,
387
- "eval_samples_per_second": 78.954,
388
- "eval_steps_per_second": 9.894,
389
  "step": 2440
390
  },
391
  {
@@ -393,9 +393,9 @@
393
  "step": 2440,
394
  "total_flos": 7609911792720000.0,
395
  "train_loss": 0.3206107397548488,
396
- "train_runtime": 1956.4863,
397
- "train_samples_per_second": 37.189,
398
- "train_steps_per_second": 1.247
399
  }
400
  ],
401
  "logging_steps": 500,
 
22
  "eval_loss": 0.5075693130493164,
23
  "eval_precision": 0.6564625850340136,
24
  "eval_recall": 0.6463902527732315,
25
+ "eval_runtime": 4.7027,
26
+ "eval_samples_per_second": 84.844,
27
+ "eval_steps_per_second": 10.632,
28
  "step": 122
29
  },
30
  {
 
41
  "eval_loss": 0.48389074206352234,
42
  "eval_precision": 0.7106679035250464,
43
  "eval_recall": 0.7409074377159484,
44
+ "eval_runtime": 5.045,
45
+ "eval_samples_per_second": 79.089,
46
+ "eval_steps_per_second": 9.911,
47
  "step": 244
48
  },
49
  {
 
60
  "eval_loss": 0.425637811422348,
61
  "eval_precision": 0.7280813755532857,
62
  "eval_recall": 0.7436352064011639,
63
+ "eval_runtime": 5.0509,
64
+ "eval_samples_per_second": 78.996,
65
+ "eval_steps_per_second": 9.899,
66
  "step": 366
67
  },
68
  {
 
79
  "eval_loss": 0.387967973947525,
80
  "eval_precision": 0.7798245614035089,
81
  "eval_recall": 0.7755501000181851,
82
+ "eval_runtime": 5.0567,
83
+ "eval_samples_per_second": 78.905,
84
+ "eval_steps_per_second": 9.888,
85
  "step": 488
86
  },
87
  {
 
98
  "eval_loss": 0.4130999743938446,
99
  "eval_precision": 0.765661378526179,
100
  "eval_recall": 0.7974177123113293,
101
+ "eval_runtime": 5.0544,
102
+ "eval_samples_per_second": 78.942,
103
+ "eval_steps_per_second": 9.892,
104
  "step": 610
105
  },
106
  {
 
117
  "eval_loss": 0.36453139781951904,
118
  "eval_precision": 0.7965023376930815,
119
  "eval_recall": 0.803691580287325,
120
+ "eval_runtime": 5.1261,
121
+ "eval_samples_per_second": 77.836,
122
+ "eval_steps_per_second": 9.754,
123
  "step": 732
124
  },
125
  {
 
136
  "eval_loss": 0.3639658987522125,
137
  "eval_precision": 0.798820781588242,
138
  "eval_recall": 0.8179669030732861,
139
+ "eval_runtime": 5.0556,
140
+ "eval_samples_per_second": 78.923,
141
+ "eval_steps_per_second": 9.89,
142
  "step": 854
143
  },
144
  {
 
155
  "eval_loss": 0.3551309108734131,
156
  "eval_precision": 0.7996165051429931,
157
  "eval_recall": 0.8054646299327151,
158
+ "eval_runtime": 5.0625,
159
+ "eval_samples_per_second": 78.815,
160
+ "eval_steps_per_second": 9.877,
161
  "step": 976
162
  },
163
  {
 
174
  "eval_loss": 0.3508576452732086,
175
  "eval_precision": 0.8169406150583245,
176
  "eval_recall": 0.8261047463175123,
177
+ "eval_runtime": 5.0808,
178
+ "eval_samples_per_second": 78.53,
179
+ "eval_steps_per_second": 9.841,
180
  "step": 1098
181
  },
182
  {
 
193
  "eval_loss": 0.341298907995224,
194
  "eval_precision": 0.8212799324446589,
195
  "eval_recall": 0.8228768867066739,
196
+ "eval_runtime": 5.0712,
197
+ "eval_samples_per_second": 78.679,
198
+ "eval_steps_per_second": 9.86,
199
  "step": 1220
200
  },
201
  {
 
212
  "eval_loss": 0.3493994474411011,
213
  "eval_precision": 0.8192918192918193,
214
  "eval_recall": 0.8328787052191308,
215
+ "eval_runtime": 5.0816,
216
+ "eval_samples_per_second": 78.518,
217
+ "eval_steps_per_second": 9.839,
218
  "step": 1342
219
  },
220
  {
 
231
  "eval_loss": 0.35203850269317627,
232
  "eval_precision": 0.822024085224641,
233
  "eval_recall": 0.837152209492635,
234
+ "eval_runtime": 5.0478,
235
+ "eval_samples_per_second": 79.045,
236
+ "eval_steps_per_second": 9.905,
237
  "step": 1464
238
  },
239
  {
 
250
  "eval_loss": 0.33577361702919006,
251
  "eval_precision": 0.8201621387462095,
252
  "eval_recall": 0.8136024731769412,
253
+ "eval_runtime": 5.0664,
254
+ "eval_samples_per_second": 78.754,
255
+ "eval_steps_per_second": 9.869,
256
  "step": 1586
257
  },
258
  {
 
269
  "eval_loss": 0.3354940712451935,
270
  "eval_precision": 0.8352012604792199,
271
  "eval_recall": 0.8417439534460811,
272
+ "eval_runtime": 5.0946,
273
+ "eval_samples_per_second": 78.318,
274
+ "eval_steps_per_second": 9.814,
275
  "step": 1708
276
  },
277
  {
 
288
  "eval_loss": 0.3406221270561218,
289
  "eval_precision": 0.8345705196182396,
290
  "eval_recall": 0.8442444080741953,
291
+ "eval_runtime": 5.0603,
292
+ "eval_samples_per_second": 78.849,
293
+ "eval_steps_per_second": 9.881,
294
  "step": 1830
295
  },
296
  {
 
307
  "eval_loss": 0.337022989988327,
308
  "eval_precision": 0.8308913308913308,
309
  "eval_recall": 0.8449718130569195,
310
+ "eval_runtime": 5.085,
311
+ "eval_samples_per_second": 78.466,
312
+ "eval_steps_per_second": 9.833,
313
  "step": 1952
314
  },
315
  {
 
326
  "eval_loss": 0.3271777033805847,
327
  "eval_precision": 0.8411320530352577,
328
  "eval_recall": 0.8477905073649754,
329
+ "eval_runtime": 5.0503,
330
+ "eval_samples_per_second": 79.006,
331
+ "eval_steps_per_second": 9.9,
332
  "step": 2074
333
  },
334
  {
 
345
  "eval_loss": 0.3318663537502289,
346
  "eval_precision": 0.8313636363636363,
347
  "eval_recall": 0.8424713584288053,
348
+ "eval_runtime": 5.0901,
349
+ "eval_samples_per_second": 78.388,
350
+ "eval_steps_per_second": 9.823,
351
  "step": 2196
352
  },
353
  {
 
364
  "eval_loss": 0.3293265402317047,
365
  "eval_precision": 0.8411320530352577,
366
  "eval_recall": 0.8477905073649754,
367
+ "eval_runtime": 5.0466,
368
+ "eval_samples_per_second": 79.064,
369
+ "eval_steps_per_second": 9.908,
370
  "step": 2318
371
  },
372
  {
 
383
  "eval_loss": 0.33090195059776306,
384
  "eval_precision": 0.8378262413446174,
385
  "eval_recall": 0.8460174577195854,
386
+ "eval_runtime": 5.0648,
387
+ "eval_samples_per_second": 78.78,
388
+ "eval_steps_per_second": 9.872,
389
  "step": 2440
390
  },
391
  {
 
393
  "step": 2440,
394
  "total_flos": 7609911792720000.0,
395
  "train_loss": 0.3206107397548488,
396
+ "train_runtime": 1939.2465,
397
+ "train_samples_per_second": 37.52,
398
+ "train_steps_per_second": 1.258
399
  }
400
  ],
401
  "logging_steps": 500,