nlpso committed on
Commit
f2a84c8
1 Parent(s): d2ec531

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O",
16
+ "1": "I-PER",
17
+ "2": "I-TITRE",
18
+ "3": "I-ACT",
19
+ "4": "I-LOC",
20
+ "5": "I-CARDINAL",
21
+ "6": "I-FT"
22
+ },
23
+ "initializer_range": 0.02,
24
+ "intermediate_size": 3072,
25
+ "label2id": {
26
+ "I-ACT": 3,
27
+ "I-CARDINAL": 5,
28
+ "I-FT": 6,
29
+ "I-LOC": 4,
30
+ "I-PER": 1,
31
+ "I-TITRE": 2,
32
+ "O": 0
33
+ },
34
+ "layer_norm_eps": 1e-05,
35
+ "max_position_embeddings": 514,
36
+ "model_type": "camembert",
37
+ "num_attention_heads": 12,
38
+ "num_hidden_layers": 12,
39
+ "output_past": true,
40
+ "pad_token_id": 1,
41
+ "position_embedding_type": "absolute",
42
+ "torch_dtype": "float32",
43
+ "transformers_version": "4.25.1",
44
+ "type_vocab_size": 1,
45
+ "use_cache": true,
46
+ "vocab_size": 32005
47
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b436873117bdd544da4851b43a079f9e357e8065ef12d431c890124fd8ebe9b1
3
+ size 880409317
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4d9fe1800b112be60bbd532d6b178aaa8948952e476dfd70ac3446b774f526
3
+ size 440218033
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d741a85c4faa3af8e61ac6d28da871def49b72c259e734a90d1747b0880d4ae4
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49b57bc5172463fef07fc294451bc054e3a77eb4220472a8f5c71745e477f749
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9642591213700671,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/41-flat-ner-pero-ocr-camembert_ner/checkpoint-900",
4
+ "epoch": 2.362204724409449,
5
+ "global_step": 900,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8502242152466369,
14
+ "number": 519,
15
+ "precision": 0.7953020134228188,
16
+ "recall": 0.9132947976878613
17
+ },
18
+ "eval_CARDINAL": {
19
+ "f1": 0.9723032069970846,
20
+ "number": 678,
21
+ "precision": 0.9610951008645533,
22
+ "recall": 0.9837758112094396
23
+ },
24
+ "eval_FT": {
25
+ "f1": 0.0,
26
+ "number": 7,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_LOC": {
31
+ "f1": 0.9184993531694695,
32
+ "number": 761,
33
+ "precision": 0.9044585987261147,
34
+ "recall": 0.9329829172141918
35
+ },
36
+ "eval_PER": {
37
+ "f1": 0.9062957540263543,
38
+ "number": 679,
39
+ "precision": 0.901018922852984,
40
+ "recall": 0.9116347569955817
41
+ },
42
+ "eval_TITRE": {
43
+ "f1": 0.0,
44
+ "number": 41,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_accuracy": 0.9454568463680081,
49
+ "eval_f1": 0.9069212410501192,
50
+ "eval_loss": 0.2516954839229584,
51
+ "eval_precision": 0.8942795076031861,
52
+ "eval_recall": 0.9199255121042831,
53
+ "eval_runtime": 2.036,
54
+ "eval_samples_per_second": 332.026,
55
+ "eval_steps_per_second": 21.12,
56
+ "step": 100
57
+ },
58
+ {
59
+ "epoch": 0.52,
60
+ "eval_ACT": {
61
+ "f1": 0.8866359447004608,
62
+ "number": 519,
63
+ "precision": 0.8498233215547704,
64
+ "recall": 0.9267822736030829
65
+ },
66
+ "eval_CARDINAL": {
67
+ "f1": 0.9786607799852833,
68
+ "number": 678,
69
+ "precision": 0.9765051395007343,
70
+ "recall": 0.9808259587020649
71
+ },
72
+ "eval_FT": {
73
+ "f1": 0.0,
74
+ "number": 7,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_LOC": {
79
+ "f1": 0.9327296248382924,
80
+ "number": 761,
81
+ "precision": 0.9184713375796179,
82
+ "recall": 0.9474375821287779
83
+ },
84
+ "eval_PER": {
85
+ "f1": 0.9166666666666666,
86
+ "number": 679,
87
+ "precision": 0.9100145137880987,
88
+ "recall": 0.9234167893961709
89
+ },
90
+ "eval_TITRE": {
91
+ "f1": 0.0,
92
+ "number": 41,
93
+ "precision": 0.0,
94
+ "recall": 0.0
95
+ },
96
+ "eval_accuracy": 0.9538091622374083,
97
+ "eval_f1": 0.9226785053644099,
98
+ "eval_loss": 0.18263815343379974,
99
+ "eval_precision": 0.9165747886806321,
100
+ "eval_recall": 0.9288640595903166,
101
+ "eval_runtime": 2.0314,
102
+ "eval_samples_per_second": 332.78,
103
+ "eval_steps_per_second": 21.168,
104
+ "step": 200
105
+ },
106
+ {
107
+ "epoch": 0.79,
108
+ "eval_ACT": {
109
+ "f1": 0.9261744966442953,
110
+ "number": 519,
111
+ "precision": 0.9217557251908397,
112
+ "recall": 0.930635838150289
113
+ },
114
+ "eval_CARDINAL": {
115
+ "f1": 0.9816581071166545,
116
+ "number": 678,
117
+ "precision": 0.9766423357664233,
118
+ "recall": 0.9867256637168141
119
+ },
120
+ "eval_FT": {
121
+ "f1": 0.0,
122
+ "number": 7,
123
+ "precision": 0.0,
124
+ "recall": 0.0
125
+ },
126
+ "eval_LOC": {
127
+ "f1": 0.947780678851175,
128
+ "number": 761,
129
+ "precision": 0.9416342412451362,
130
+ "recall": 0.9540078843626807
131
+ },
132
+ "eval_PER": {
133
+ "f1": 0.94620486366986,
134
+ "number": 679,
135
+ "precision": 0.9469026548672567,
136
+ "recall": 0.9455081001472754
137
+ },
138
+ "eval_TITRE": {
139
+ "f1": 0.4675324675324676,
140
+ "number": 41,
141
+ "precision": 0.5,
142
+ "recall": 0.43902439024390244
143
+ },
144
+ "eval_accuracy": 0.9639331814730449,
145
+ "eval_f1": 0.9436698271054099,
146
+ "eval_loss": 0.13531556725502014,
147
+ "eval_precision": 0.9420935412026726,
148
+ "eval_recall": 0.9452513966480447,
149
+ "eval_runtime": 2.0117,
150
+ "eval_samples_per_second": 336.027,
151
+ "eval_steps_per_second": 21.375,
152
+ "step": 300
153
+ },
154
+ {
155
+ "epoch": 1.05,
156
+ "eval_ACT": {
157
+ "f1": 0.9381541389153186,
158
+ "number": 519,
159
+ "precision": 0.9266917293233082,
160
+ "recall": 0.9499036608863198
161
+ },
162
+ "eval_CARDINAL": {
163
+ "f1": 0.9852724594992636,
164
+ "number": 678,
165
+ "precision": 0.9838235294117647,
166
+ "recall": 0.9867256637168141
167
+ },
168
+ "eval_FT": {
169
+ "f1": 0.0,
170
+ "number": 7,
171
+ "precision": 0.0,
172
+ "recall": 0.0
173
+ },
174
+ "eval_LOC": {
175
+ "f1": 0.9483322432962721,
176
+ "number": 761,
177
+ "precision": 0.9440104166666666,
178
+ "recall": 0.9526938239159002
179
+ },
180
+ "eval_PER": {
181
+ "f1": 0.9553113553113554,
182
+ "number": 679,
183
+ "precision": 0.9504373177842566,
184
+ "recall": 0.9602356406480118
185
+ },
186
+ "eval_TITRE": {
187
+ "f1": 0.5813953488372093,
188
+ "number": 41,
189
+ "precision": 0.5555555555555556,
190
+ "recall": 0.6097560975609756
191
+ },
192
+ "eval_accuracy": 0.9646924829157175,
193
+ "eval_f1": 0.9503335804299481,
194
+ "eval_loss": 0.11591742187738419,
195
+ "eval_precision": 0.9457764662486168,
196
+ "eval_recall": 0.9549348230912477,
197
+ "eval_runtime": 2.0409,
198
+ "eval_samples_per_second": 331.23,
199
+ "eval_steps_per_second": 21.069,
200
+ "step": 400
201
+ },
202
+ {
203
+ "epoch": 1.31,
204
+ "learning_rate": 9e-05,
205
+ "loss": 0.2356,
206
+ "step": 500
207
+ },
208
+ {
209
+ "epoch": 1.31,
210
+ "eval_ACT": {
211
+ "f1": 0.9393939393939394,
212
+ "number": 519,
213
+ "precision": 0.9236499068901304,
214
+ "recall": 0.9556840077071291
215
+ },
216
+ "eval_CARDINAL": {
217
+ "f1": 0.9830258302583026,
218
+ "number": 678,
219
+ "precision": 0.983751846381093,
220
+ "recall": 0.9823008849557522
221
+ },
222
+ "eval_FT": {
223
+ "f1": 0.0,
224
+ "number": 7,
225
+ "precision": 0.0,
226
+ "recall": 0.0
227
+ },
228
+ "eval_LOC": {
229
+ "f1": 0.944769330734243,
230
+ "number": 761,
231
+ "precision": 0.9344473007712082,
232
+ "recall": 0.9553219448094612
233
+ },
234
+ "eval_PER": {
235
+ "f1": 0.9618208516886931,
236
+ "number": 679,
237
+ "precision": 0.95900439238653,
238
+ "recall": 0.9646539027982327
239
+ },
240
+ "eval_TITRE": {
241
+ "f1": 0.684931506849315,
242
+ "number": 41,
243
+ "precision": 0.78125,
244
+ "recall": 0.6097560975609756
245
+ },
246
+ "eval_accuracy": 0.9710199949379904,
247
+ "eval_f1": 0.952893175074184,
248
+ "eval_loss": 0.10950864851474762,
249
+ "eval_precision": 0.949021056520133,
250
+ "eval_recall": 0.9567970204841714,
251
+ "eval_runtime": 2.1232,
252
+ "eval_samples_per_second": 318.382,
253
+ "eval_steps_per_second": 20.252,
254
+ "step": 500
255
+ },
256
+ {
257
+ "epoch": 1.57,
258
+ "eval_ACT": {
259
+ "f1": 0.9485714285714286,
260
+ "number": 519,
261
+ "precision": 0.9378531073446328,
262
+ "recall": 0.9595375722543352
263
+ },
264
+ "eval_CARDINAL": {
265
+ "f1": 0.9801907556859869,
266
+ "number": 678,
267
+ "precision": 0.9751824817518249,
268
+ "recall": 0.9852507374631269
269
+ },
270
+ "eval_FT": {
271
+ "f1": 0.0,
272
+ "number": 7,
273
+ "precision": 0.0,
274
+ "recall": 0.0
275
+ },
276
+ "eval_LOC": {
277
+ "f1": 0.9492187500000001,
278
+ "number": 761,
279
+ "precision": 0.9406451612903226,
280
+ "recall": 0.9579500657030223
281
+ },
282
+ "eval_PER": {
283
+ "f1": 0.96759941089838,
284
+ "number": 679,
285
+ "precision": 0.96759941089838,
286
+ "recall": 0.96759941089838
287
+ },
288
+ "eval_TITRE": {
289
+ "f1": 0.7160493827160495,
290
+ "number": 41,
291
+ "precision": 0.725,
292
+ "recall": 0.7073170731707317
293
+ },
294
+ "eval_accuracy": 0.9716527461402177,
295
+ "eval_f1": 0.9568118628359593,
296
+ "eval_loss": 0.09932182729244232,
297
+ "eval_precision": 0.9523985239852398,
298
+ "eval_recall": 0.9612662942271881,
299
+ "eval_runtime": 2.1374,
300
+ "eval_samples_per_second": 316.273,
301
+ "eval_steps_per_second": 20.118,
302
+ "step": 600
303
+ },
304
+ {
305
+ "epoch": 1.84,
306
+ "eval_ACT": {
307
+ "f1": 0.9541984732824428,
308
+ "number": 519,
309
+ "precision": 0.945179584120983,
310
+ "recall": 0.9633911368015414
311
+ },
312
+ "eval_CARDINAL": {
313
+ "f1": 0.9852507374631269,
314
+ "number": 678,
315
+ "precision": 0.9852507374631269,
316
+ "recall": 0.9852507374631269
317
+ },
318
+ "eval_FT": {
319
+ "f1": 0.0,
320
+ "number": 7,
321
+ "precision": 0.0,
322
+ "recall": 0.0
323
+ },
324
+ "eval_LOC": {
325
+ "f1": 0.9510124101894187,
326
+ "number": 761,
327
+ "precision": 0.9454545454545454,
328
+ "recall": 0.9566360052562418
329
+ },
330
+ "eval_PER": {
331
+ "f1": 0.9771891096394407,
332
+ "number": 679,
333
+ "precision": 0.9764705882352941,
334
+ "recall": 0.9779086892488954
335
+ },
336
+ "eval_TITRE": {
337
+ "f1": 0.7848101265822786,
338
+ "number": 41,
339
+ "precision": 0.8157894736842105,
340
+ "recall": 0.7560975609756098
341
+ },
342
+ "eval_accuracy": 0.9779802581624905,
343
+ "eval_f1": 0.9631970260223048,
344
+ "eval_loss": 0.08475597947835922,
345
+ "eval_precision": 0.9614100185528757,
346
+ "eval_recall": 0.9649906890130354,
347
+ "eval_runtime": 2.0431,
348
+ "eval_samples_per_second": 330.877,
349
+ "eval_steps_per_second": 21.047,
350
+ "step": 700
351
+ },
352
+ {
353
+ "epoch": 2.1,
354
+ "eval_ACT": {
355
+ "f1": 0.9468690702087287,
356
+ "number": 519,
357
+ "precision": 0.9327102803738317,
358
+ "recall": 0.9614643545279383
359
+ },
360
+ "eval_CARDINAL": {
361
+ "f1": 0.9852507374631269,
362
+ "number": 678,
363
+ "precision": 0.9852507374631269,
364
+ "recall": 0.9852507374631269
365
+ },
366
+ "eval_FT": {
367
+ "f1": 0.0,
368
+ "number": 7,
369
+ "precision": 0.0,
370
+ "recall": 0.0
371
+ },
372
+ "eval_LOC": {
373
+ "f1": 0.9432485322896281,
374
+ "number": 761,
375
+ "precision": 0.9365284974093264,
376
+ "recall": 0.9500657030223391
377
+ },
378
+ "eval_PER": {
379
+ "f1": 0.9705882352941176,
380
+ "number": 679,
381
+ "precision": 0.9691629955947136,
382
+ "recall": 0.9720176730486009
383
+ },
384
+ "eval_TITRE": {
385
+ "f1": 0.7594936708860759,
386
+ "number": 41,
387
+ "precision": 0.7894736842105263,
388
+ "recall": 0.7317073170731707
389
+ },
390
+ "eval_accuracy": 0.9746899519109087,
391
+ "eval_f1": 0.9575060308034886,
392
+ "eval_loss": 0.08957625180482864,
393
+ "eval_precision": 0.9541420118343196,
394
+ "eval_recall": 0.9608938547486033,
395
+ "eval_runtime": 2.0502,
396
+ "eval_samples_per_second": 329.727,
397
+ "eval_steps_per_second": 20.974,
398
+ "step": 800
399
+ },
400
+ {
401
+ "epoch": 2.36,
402
+ "eval_ACT": {
403
+ "f1": 0.9570200573065903,
404
+ "number": 519,
405
+ "precision": 0.9488636363636364,
406
+ "recall": 0.9653179190751445
407
+ },
408
+ "eval_CARDINAL": {
409
+ "f1": 0.9866666666666667,
410
+ "number": 678,
411
+ "precision": 0.9910714285714286,
412
+ "recall": 0.9823008849557522
413
+ },
414
+ "eval_FT": {
415
+ "f1": 0.22222222222222224,
416
+ "number": 7,
417
+ "precision": 0.5,
418
+ "recall": 0.14285714285714285
419
+ },
420
+ "eval_LOC": {
421
+ "f1": 0.9542483660130721,
422
+ "number": 761,
423
+ "precision": 0.9492847854356307,
424
+ "recall": 0.9592641261498029
425
+ },
426
+ "eval_PER": {
427
+ "f1": 0.9779086892488954,
428
+ "number": 679,
429
+ "precision": 0.9779086892488954,
430
+ "recall": 0.9779086892488954
431
+ },
432
+ "eval_TITRE": {
433
+ "f1": 0.7179487179487181,
434
+ "number": 41,
435
+ "precision": 0.7567567567567568,
436
+ "recall": 0.6829268292682927
437
+ },
438
+ "eval_accuracy": 0.9743103011895723,
439
+ "eval_f1": 0.9642591213700671,
440
+ "eval_loss": 0.08395500481128693,
441
+ "eval_precision": 0.9639002605135839,
442
+ "eval_recall": 0.9646182495344506,
443
+ "eval_runtime": 2.07,
444
+ "eval_samples_per_second": 326.576,
445
+ "eval_steps_per_second": 20.773,
446
+ "step": 900
447
+ }
448
+ ],
449
+ "max_steps": 5000,
450
+ "num_train_epochs": 14,
451
+ "total_flos": 365778917703408.0,
452
+ "trial_name": null,
453
+ "trial_params": null
454
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8decc10feab607704e246b8336e35d634cf0dc1065defecb21111669a5ae243
3
+ size 3503