sreejith8100 committed on
Commit
b0d8fee
1 Parent(s): e44f499

End of training

Browse files
added_tokens.json CHANGED
@@ -1,49 +1,11 @@
1
  {
2
  "</s>": 2,
3
- "</s_DOB>": 57558,
4
- "</s_Name_of_hospital>": 57547,
5
- "</s_POB_city>": 57539,
6
- "</s_POB_province>": 57562,
7
- "</s_UR_mother_city>": 57552,
8
- "</s_UR_mother_province>": 57555,
9
- "</s_UR_mother_street>": 57525,
10
- "</s_child_first_name>": 57532,
11
- "</s_child_last_name>": 57561,
12
- "</s_child_middle_name>": 57556,
13
- "</s_city>": 57533,
14
- "</s_father_birthplace>": 57554,
15
- "</s_father_first_name>": 57530,
16
- "</s_father_last_name>": 57553,
17
- "</s_father_middle_name>": 57564,
18
- "</s_mother_birthplace>": 57546,
19
- "</s_mother_first_name>": 57545,
20
- "</s_mother_last_name>": 57543,
21
- "</s_mother_middle_name>": 57550,
22
- "</s_province>": 57563,
23
  "<mask>": 57521,
24
  "<pad>": 1,
25
  "<s>": 0,
26
- "<s_DOB>": 57540,
27
- "<s_Name_of_hospital>": 57557,
28
- "<s_POB_city>": 57538,
29
- "<s_POB_province>": 57541,
30
- "<s_UR_mother_city>": 57529,
31
- "<s_UR_mother_province>": 57548,
32
- "<s_UR_mother_street>": 57531,
33
- "<s_child_first_name>": 57549,
34
- "<s_child_last_name>": 57536,
35
- "<s_child_middle_name>": 57537,
36
- "<s_city>": 57544,
37
- "<s_father_birthplace>": 57560,
38
- "<s_father_first_name>": 57534,
39
- "<s_father_last_name>": 57528,
40
- "<s_father_middle_name>": 57551,
41
  "<s_iitcdip>": 57523,
42
- "<s_mother_birthplace>": 57542,
43
- "<s_mother_first_name>": 57559,
44
- "<s_mother_last_name>": 57527,
45
- "<s_mother_middle_name>": 57535,
46
- "<s_province>": 57526,
47
  "<s_synthdog>": 57524,
48
  "<sep/>": 57522,
49
  "<unk>": 3
 
1
  {
2
  "</s>": 2,
3
+ "</s_province>": 57526,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  "<mask>": 57521,
5
  "<pad>": 1,
6
  "<s>": 0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  "<s_iitcdip>": 57523,
8
+ "<s_province>": 57525,
 
 
 
 
9
  "<s_synthdog>": 57524,
10
  "<sep/>": 57522,
11
  "<unk>": 3
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:329e6727dd3f9eeea52fc6757b4c3b6e83eaec72d9bef537454a56e8f2e6f327
3
  size 809187097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18364dee00c41a317efa603aafeb7738c8414b45685b09add86ef81c41edf647
3
  size 809187097
special_tokens_map.json CHANGED
@@ -2,48 +2,10 @@
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
5
- "</s_UR_mother_street>",
6
- "<s_province>",
7
- "<s_mother_last_name>",
8
- "<s_father_last_name>",
9
- "<s_UR_mother_city>",
10
- "</s_father_first_name>",
11
- "<s_UR_mother_street>",
12
- "</s_child_first_name>",
13
- "</s_city>",
14
- "<s_father_first_name>",
15
- "<s_mother_middle_name>",
16
- "<s_child_last_name>",
17
- "<s_child_middle_name>",
18
- "<s_POB_city>",
19
- "</s_POB_city>",
20
- "<s_DOB>",
21
- "<s_POB_province>",
22
- "<s_mother_birthplace>",
23
- "</s_mother_last_name>",
24
- "<s_city>",
25
  "<s>",
26
- "</s_mother_first_name>",
27
- "</s_mother_birthplace>",
28
- "</s_Name_of_hospital>",
29
- "<s_UR_mother_province>",
30
- "<s_child_first_name>",
31
- "</s_mother_middle_name>",
32
- "<s_father_middle_name>",
33
- "</s_UR_mother_city>",
34
- "</s_father_last_name>",
35
- "</s_father_birthplace>",
36
- "</s_UR_mother_province>",
37
- "</s_child_middle_name>",
38
  "</s>",
39
- "<s_Name_of_hospital>",
40
- "</s_DOB>",
41
- "<s_mother_first_name>",
42
- "<s_father_birthplace>",
43
- "</s_child_last_name>",
44
- "</s_POB_province>",
45
- "</s_province>",
46
- "</s_father_middle_name>"
47
  ],
48
  "bos_token": "<s>",
49
  "cls_token": "<s>",
 
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "<s>",
 
 
 
 
 
 
 
 
 
 
 
 
6
  "</s>",
7
+ "<s_province>",
8
+ "</s_province>"
 
 
 
 
 
 
9
  ],
10
  "bos_token": "<s>",
11
  "cls_token": "<s>",
tokenizer.json CHANGED
@@ -91,15 +91,6 @@
91
  },
92
  {
93
  "id": 57525,
94
- "content": "</s_UR_mother_street>",
95
- "single_word": false,
96
- "lstrip": true,
97
- "rstrip": true,
98
- "normalized": false,
99
- "special": true
100
- },
101
- {
102
- "id": 57526,
103
  "content": "<s_province>",
104
  "single_word": false,
105
  "lstrip": true,
@@ -108,346 +99,13 @@
108
  "special": true
109
  },
110
  {
111
- "id": 57527,
112
- "content": "<s_mother_last_name>",
113
- "single_word": false,
114
- "lstrip": true,
115
- "rstrip": true,
116
- "normalized": false,
117
- "special": true
118
- },
119
- {
120
- "id": 57528,
121
- "content": "<s_father_last_name>",
122
- "single_word": false,
123
- "lstrip": true,
124
- "rstrip": true,
125
- "normalized": false,
126
- "special": true
127
- },
128
- {
129
- "id": 57529,
130
- "content": "<s_UR_mother_city>",
131
- "single_word": false,
132
- "lstrip": true,
133
- "rstrip": true,
134
- "normalized": false,
135
- "special": true
136
- },
137
- {
138
- "id": 57530,
139
- "content": "</s_father_first_name>",
140
- "single_word": false,
141
- "lstrip": true,
142
- "rstrip": true,
143
- "normalized": false,
144
- "special": true
145
- },
146
- {
147
- "id": 57531,
148
- "content": "<s_UR_mother_street>",
149
- "single_word": false,
150
- "lstrip": true,
151
- "rstrip": true,
152
- "normalized": false,
153
- "special": true
154
- },
155
- {
156
- "id": 57532,
157
- "content": "</s_child_first_name>",
158
- "single_word": false,
159
- "lstrip": true,
160
- "rstrip": true,
161
- "normalized": false,
162
- "special": true
163
- },
164
- {
165
- "id": 57533,
166
- "content": "</s_city>",
167
- "single_word": false,
168
- "lstrip": true,
169
- "rstrip": true,
170
- "normalized": false,
171
- "special": true
172
- },
173
- {
174
- "id": 57534,
175
- "content": "<s_father_first_name>",
176
- "single_word": false,
177
- "lstrip": true,
178
- "rstrip": true,
179
- "normalized": false,
180
- "special": true
181
- },
182
- {
183
- "id": 57535,
184
- "content": "<s_mother_middle_name>",
185
- "single_word": false,
186
- "lstrip": true,
187
- "rstrip": true,
188
- "normalized": false,
189
- "special": true
190
- },
191
- {
192
- "id": 57536,
193
- "content": "<s_child_last_name>",
194
- "single_word": false,
195
- "lstrip": true,
196
- "rstrip": true,
197
- "normalized": false,
198
- "special": true
199
- },
200
- {
201
- "id": 57537,
202
- "content": "<s_child_middle_name>",
203
- "single_word": false,
204
- "lstrip": true,
205
- "rstrip": true,
206
- "normalized": false,
207
- "special": true
208
- },
209
- {
210
- "id": 57538,
211
- "content": "<s_POB_city>",
212
- "single_word": false,
213
- "lstrip": true,
214
- "rstrip": true,
215
- "normalized": false,
216
- "special": true
217
- },
218
- {
219
- "id": 57539,
220
- "content": "</s_POB_city>",
221
- "single_word": false,
222
- "lstrip": true,
223
- "rstrip": true,
224
- "normalized": false,
225
- "special": true
226
- },
227
- {
228
- "id": 57540,
229
- "content": "<s_DOB>",
230
- "single_word": false,
231
- "lstrip": true,
232
- "rstrip": true,
233
- "normalized": false,
234
- "special": true
235
- },
236
- {
237
- "id": 57541,
238
- "content": "<s_POB_province>",
239
- "single_word": false,
240
- "lstrip": true,
241
- "rstrip": true,
242
- "normalized": false,
243
- "special": true
244
- },
245
- {
246
- "id": 57542,
247
- "content": "<s_mother_birthplace>",
248
- "single_word": false,
249
- "lstrip": true,
250
- "rstrip": true,
251
- "normalized": false,
252
- "special": true
253
- },
254
- {
255
- "id": 57543,
256
- "content": "</s_mother_last_name>",
257
- "single_word": false,
258
- "lstrip": true,
259
- "rstrip": true,
260
- "normalized": false,
261
- "special": true
262
- },
263
- {
264
- "id": 57544,
265
- "content": "<s_city>",
266
- "single_word": false,
267
- "lstrip": true,
268
- "rstrip": true,
269
- "normalized": false,
270
- "special": true
271
- },
272
- {
273
- "id": 57545,
274
- "content": "</s_mother_first_name>",
275
- "single_word": false,
276
- "lstrip": true,
277
- "rstrip": true,
278
- "normalized": false,
279
- "special": true
280
- },
281
- {
282
- "id": 57546,
283
- "content": "</s_mother_birthplace>",
284
- "single_word": false,
285
- "lstrip": true,
286
- "rstrip": true,
287
- "normalized": false,
288
- "special": true
289
- },
290
- {
291
- "id": 57547,
292
- "content": "</s_Name_of_hospital>",
293
- "single_word": false,
294
- "lstrip": true,
295
- "rstrip": true,
296
- "normalized": false,
297
- "special": true
298
- },
299
- {
300
- "id": 57548,
301
- "content": "<s_UR_mother_province>",
302
- "single_word": false,
303
- "lstrip": true,
304
- "rstrip": true,
305
- "normalized": false,
306
- "special": true
307
- },
308
- {
309
- "id": 57549,
310
- "content": "<s_child_first_name>",
311
- "single_word": false,
312
- "lstrip": true,
313
- "rstrip": true,
314
- "normalized": false,
315
- "special": true
316
- },
317
- {
318
- "id": 57550,
319
- "content": "</s_mother_middle_name>",
320
- "single_word": false,
321
- "lstrip": true,
322
- "rstrip": true,
323
- "normalized": false,
324
- "special": true
325
- },
326
- {
327
- "id": 57551,
328
- "content": "<s_father_middle_name>",
329
- "single_word": false,
330
- "lstrip": true,
331
- "rstrip": true,
332
- "normalized": false,
333
- "special": true
334
- },
335
- {
336
- "id": 57552,
337
- "content": "</s_UR_mother_city>",
338
- "single_word": false,
339
- "lstrip": true,
340
- "rstrip": true,
341
- "normalized": false,
342
- "special": true
343
- },
344
- {
345
- "id": 57553,
346
- "content": "</s_father_last_name>",
347
- "single_word": false,
348
- "lstrip": true,
349
- "rstrip": true,
350
- "normalized": false,
351
- "special": true
352
- },
353
- {
354
- "id": 57554,
355
- "content": "</s_father_birthplace>",
356
- "single_word": false,
357
- "lstrip": true,
358
- "rstrip": true,
359
- "normalized": false,
360
- "special": true
361
- },
362
- {
363
- "id": 57555,
364
- "content": "</s_UR_mother_province>",
365
- "single_word": false,
366
- "lstrip": true,
367
- "rstrip": true,
368
- "normalized": false,
369
- "special": true
370
- },
371
- {
372
- "id": 57556,
373
- "content": "</s_child_middle_name>",
374
- "single_word": false,
375
- "lstrip": true,
376
- "rstrip": true,
377
- "normalized": false,
378
- "special": true
379
- },
380
- {
381
- "id": 57557,
382
- "content": "<s_Name_of_hospital>",
383
- "single_word": false,
384
- "lstrip": true,
385
- "rstrip": true,
386
- "normalized": false,
387
- "special": true
388
- },
389
- {
390
- "id": 57558,
391
- "content": "</s_DOB>",
392
- "single_word": false,
393
- "lstrip": true,
394
- "rstrip": true,
395
- "normalized": false,
396
- "special": true
397
- },
398
- {
399
- "id": 57559,
400
- "content": "<s_mother_first_name>",
401
- "single_word": false,
402
- "lstrip": true,
403
- "rstrip": true,
404
- "normalized": false,
405
- "special": true
406
- },
407
- {
408
- "id": 57560,
409
- "content": "<s_father_birthplace>",
410
- "single_word": false,
411
- "lstrip": true,
412
- "rstrip": true,
413
- "normalized": false,
414
- "special": true
415
- },
416
- {
417
- "id": 57561,
418
- "content": "</s_child_last_name>",
419
- "single_word": false,
420
- "lstrip": true,
421
- "rstrip": true,
422
- "normalized": false,
423
- "special": true
424
- },
425
- {
426
- "id": 57562,
427
- "content": "</s_POB_province>",
428
- "single_word": false,
429
- "lstrip": true,
430
- "rstrip": true,
431
- "normalized": false,
432
- "special": true
433
- },
434
- {
435
- "id": 57563,
436
  "content": "</s_province>",
437
  "single_word": false,
438
  "lstrip": true,
439
  "rstrip": true,
440
  "normalized": false,
441
  "special": true
442
- },
443
- {
444
- "id": 57564,
445
- "content": "</s_father_middle_name>",
446
- "single_word": false,
447
- "lstrip": true,
448
- "rstrip": true,
449
- "normalized": false,
450
- "special": true
451
  }
452
  ],
453
  "normalizer": {
 
91
  },
92
  {
93
  "id": 57525,
 
 
 
 
 
 
 
 
 
94
  "content": "<s_province>",
95
  "single_word": false,
96
  "lstrip": true,
 
99
  "special": true
100
  },
101
  {
102
+ "id": 57526,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
103
  "content": "</s_province>",
104
  "single_word": false,
105
  "lstrip": true,
106
  "rstrip": true,
107
  "normalized": false,
108
  "special": true
 
 
 
 
 
 
 
 
 
109
  }
110
  ],
111
  "normalizer": {
tokenizer_config.json CHANGED
@@ -65,14 +65,6 @@
65
  "special": true
66
  },
67
  "57525": {
68
- "content": "</s_UR_mother_street>",
69
- "lstrip": true,
70
- "normalized": false,
71
- "rstrip": true,
72
- "single_word": false,
73
- "special": true
74
- },
75
- "57526": {
76
  "content": "<s_province>",
77
  "lstrip": true,
78
  "normalized": false,
@@ -80,356 +72,22 @@
80
  "single_word": false,
81
  "special": true
82
  },
83
- "57527": {
84
- "content": "<s_mother_last_name>",
85
- "lstrip": true,
86
- "normalized": false,
87
- "rstrip": true,
88
- "single_word": false,
89
- "special": true
90
- },
91
- "57528": {
92
- "content": "<s_father_last_name>",
93
- "lstrip": true,
94
- "normalized": false,
95
- "rstrip": true,
96
- "single_word": false,
97
- "special": true
98
- },
99
- "57529": {
100
- "content": "<s_UR_mother_city>",
101
- "lstrip": true,
102
- "normalized": false,
103
- "rstrip": true,
104
- "single_word": false,
105
- "special": true
106
- },
107
- "57530": {
108
- "content": "</s_father_first_name>",
109
- "lstrip": true,
110
- "normalized": false,
111
- "rstrip": true,
112
- "single_word": false,
113
- "special": true
114
- },
115
- "57531": {
116
- "content": "<s_UR_mother_street>",
117
- "lstrip": true,
118
- "normalized": false,
119
- "rstrip": true,
120
- "single_word": false,
121
- "special": true
122
- },
123
- "57532": {
124
- "content": "</s_child_first_name>",
125
- "lstrip": true,
126
- "normalized": false,
127
- "rstrip": true,
128
- "single_word": false,
129
- "special": true
130
- },
131
- "57533": {
132
- "content": "</s_city>",
133
- "lstrip": true,
134
- "normalized": false,
135
- "rstrip": true,
136
- "single_word": false,
137
- "special": true
138
- },
139
- "57534": {
140
- "content": "<s_father_first_name>",
141
- "lstrip": true,
142
- "normalized": false,
143
- "rstrip": true,
144
- "single_word": false,
145
- "special": true
146
- },
147
- "57535": {
148
- "content": "<s_mother_middle_name>",
149
- "lstrip": true,
150
- "normalized": false,
151
- "rstrip": true,
152
- "single_word": false,
153
- "special": true
154
- },
155
- "57536": {
156
- "content": "<s_child_last_name>",
157
- "lstrip": true,
158
- "normalized": false,
159
- "rstrip": true,
160
- "single_word": false,
161
- "special": true
162
- },
163
- "57537": {
164
- "content": "<s_child_middle_name>",
165
- "lstrip": true,
166
- "normalized": false,
167
- "rstrip": true,
168
- "single_word": false,
169
- "special": true
170
- },
171
- "57538": {
172
- "content": "<s_POB_city>",
173
- "lstrip": true,
174
- "normalized": false,
175
- "rstrip": true,
176
- "single_word": false,
177
- "special": true
178
- },
179
- "57539": {
180
- "content": "</s_POB_city>",
181
- "lstrip": true,
182
- "normalized": false,
183
- "rstrip": true,
184
- "single_word": false,
185
- "special": true
186
- },
187
- "57540": {
188
- "content": "<s_DOB>",
189
- "lstrip": true,
190
- "normalized": false,
191
- "rstrip": true,
192
- "single_word": false,
193
- "special": true
194
- },
195
- "57541": {
196
- "content": "<s_POB_province>",
197
- "lstrip": true,
198
- "normalized": false,
199
- "rstrip": true,
200
- "single_word": false,
201
- "special": true
202
- },
203
- "57542": {
204
- "content": "<s_mother_birthplace>",
205
- "lstrip": true,
206
- "normalized": false,
207
- "rstrip": true,
208
- "single_word": false,
209
- "special": true
210
- },
211
- "57543": {
212
- "content": "</s_mother_last_name>",
213
- "lstrip": true,
214
- "normalized": false,
215
- "rstrip": true,
216
- "single_word": false,
217
- "special": true
218
- },
219
- "57544": {
220
- "content": "<s_city>",
221
- "lstrip": true,
222
- "normalized": false,
223
- "rstrip": true,
224
- "single_word": false,
225
- "special": true
226
- },
227
- "57545": {
228
- "content": "</s_mother_first_name>",
229
- "lstrip": true,
230
- "normalized": false,
231
- "rstrip": true,
232
- "single_word": false,
233
- "special": true
234
- },
235
- "57546": {
236
- "content": "</s_mother_birthplace>",
237
- "lstrip": true,
238
- "normalized": false,
239
- "rstrip": true,
240
- "single_word": false,
241
- "special": true
242
- },
243
- "57547": {
244
- "content": "</s_Name_of_hospital>",
245
- "lstrip": true,
246
- "normalized": false,
247
- "rstrip": true,
248
- "single_word": false,
249
- "special": true
250
- },
251
- "57548": {
252
- "content": "<s_UR_mother_province>",
253
- "lstrip": true,
254
- "normalized": false,
255
- "rstrip": true,
256
- "single_word": false,
257
- "special": true
258
- },
259
- "57549": {
260
- "content": "<s_child_first_name>",
261
- "lstrip": true,
262
- "normalized": false,
263
- "rstrip": true,
264
- "single_word": false,
265
- "special": true
266
- },
267
- "57550": {
268
- "content": "</s_mother_middle_name>",
269
- "lstrip": true,
270
- "normalized": false,
271
- "rstrip": true,
272
- "single_word": false,
273
- "special": true
274
- },
275
- "57551": {
276
- "content": "<s_father_middle_name>",
277
- "lstrip": true,
278
- "normalized": false,
279
- "rstrip": true,
280
- "single_word": false,
281
- "special": true
282
- },
283
- "57552": {
284
- "content": "</s_UR_mother_city>",
285
- "lstrip": true,
286
- "normalized": false,
287
- "rstrip": true,
288
- "single_word": false,
289
- "special": true
290
- },
291
- "57553": {
292
- "content": "</s_father_last_name>",
293
- "lstrip": true,
294
- "normalized": false,
295
- "rstrip": true,
296
- "single_word": false,
297
- "special": true
298
- },
299
- "57554": {
300
- "content": "</s_father_birthplace>",
301
- "lstrip": true,
302
- "normalized": false,
303
- "rstrip": true,
304
- "single_word": false,
305
- "special": true
306
- },
307
- "57555": {
308
- "content": "</s_UR_mother_province>",
309
- "lstrip": true,
310
- "normalized": false,
311
- "rstrip": true,
312
- "single_word": false,
313
- "special": true
314
- },
315
- "57556": {
316
- "content": "</s_child_middle_name>",
317
- "lstrip": true,
318
- "normalized": false,
319
- "rstrip": true,
320
- "single_word": false,
321
- "special": true
322
- },
323
- "57557": {
324
- "content": "<s_Name_of_hospital>",
325
- "lstrip": true,
326
- "normalized": false,
327
- "rstrip": true,
328
- "single_word": false,
329
- "special": true
330
- },
331
- "57558": {
332
- "content": "</s_DOB>",
333
- "lstrip": true,
334
- "normalized": false,
335
- "rstrip": true,
336
- "single_word": false,
337
- "special": true
338
- },
339
- "57559": {
340
- "content": "<s_mother_first_name>",
341
- "lstrip": true,
342
- "normalized": false,
343
- "rstrip": true,
344
- "single_word": false,
345
- "special": true
346
- },
347
- "57560": {
348
- "content": "<s_father_birthplace>",
349
- "lstrip": true,
350
- "normalized": false,
351
- "rstrip": true,
352
- "single_word": false,
353
- "special": true
354
- },
355
- "57561": {
356
- "content": "</s_child_last_name>",
357
- "lstrip": true,
358
- "normalized": false,
359
- "rstrip": true,
360
- "single_word": false,
361
- "special": true
362
- },
363
- "57562": {
364
- "content": "</s_POB_province>",
365
- "lstrip": true,
366
- "normalized": false,
367
- "rstrip": true,
368
- "single_word": false,
369
- "special": true
370
- },
371
- "57563": {
372
  "content": "</s_province>",
373
  "lstrip": true,
374
  "normalized": false,
375
  "rstrip": true,
376
  "single_word": false,
377
  "special": true
378
- },
379
- "57564": {
380
- "content": "</s_father_middle_name>",
381
- "lstrip": true,
382
- "normalized": false,
383
- "rstrip": true,
384
- "single_word": false,
385
- "special": true
386
  }
387
  },
388
  "additional_special_tokens": [
389
  "<s_iitcdip>",
390
  "<s_synthdog>",
391
- "</s_UR_mother_street>",
392
- "<s_province>",
393
- "<s_mother_last_name>",
394
- "<s_father_last_name>",
395
- "<s_UR_mother_city>",
396
- "</s_father_first_name>",
397
- "<s_UR_mother_street>",
398
- "</s_child_first_name>",
399
- "</s_city>",
400
- "<s_father_first_name>",
401
- "<s_mother_middle_name>",
402
- "<s_child_last_name>",
403
- "<s_child_middle_name>",
404
- "<s_POB_city>",
405
- "</s_POB_city>",
406
- "<s_DOB>",
407
- "<s_POB_province>",
408
- "<s_mother_birthplace>",
409
- "</s_mother_last_name>",
410
- "<s_city>",
411
  "<s>",
412
- "</s_mother_first_name>",
413
- "</s_mother_birthplace>",
414
- "</s_Name_of_hospital>",
415
- "<s_UR_mother_province>",
416
- "<s_child_first_name>",
417
- "</s_mother_middle_name>",
418
- "<s_father_middle_name>",
419
- "</s_UR_mother_city>",
420
- "</s_father_last_name>",
421
- "</s_father_birthplace>",
422
- "</s_UR_mother_province>",
423
- "</s_child_middle_name>",
424
  "</s>",
425
- "<s_Name_of_hospital>",
426
- "</s_DOB>",
427
- "<s_mother_first_name>",
428
- "<s_father_birthplace>",
429
- "</s_child_last_name>",
430
- "</s_POB_province>",
431
- "</s_province>",
432
- "</s_father_middle_name>"
433
  ],
434
  "bos_token": "<s>",
435
  "clean_up_tokenization_spaces": true,
 
65
  "special": true
66
  },
67
  "57525": {
 
 
 
 
 
 
 
 
68
  "content": "<s_province>",
69
  "lstrip": true,
70
  "normalized": false,
 
72
  "single_word": false,
73
  "special": true
74
  },
75
+ "57526": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
76
  "content": "</s_province>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
80
  "single_word": false,
81
  "special": true
 
 
 
 
 
 
 
 
82
  }
83
  },
84
  "additional_special_tokens": [
85
  "<s_iitcdip>",
86
  "<s_synthdog>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  "<s>",
 
 
 
 
 
 
 
 
 
 
 
 
88
  "</s>",
89
+ "<s_province>",
90
+ "</s_province>"
 
 
 
 
 
 
91
  ],
92
  "bos_token": "<s>",
93
  "clean_up_tokenization_spaces": true,