vishnu027 committed on
Commit
5460476
1 Parent(s): 8b86061

Training done

Browse files
added_tokens.json CHANGED
@@ -1,22 +1,26 @@
1
  {
2
- "</s_age>": 57534,
3
- "</s_birthplace>": 57538,
4
- "</s_bride>": 57530,
5
- "</s_groom>": 57528,
6
- "</s_marital_status>": 57540,
7
- "</s_name>": 57526,
8
- "</s_race>": 57536,
9
- "</s_residence>": 57532,
10
- "<s_age>": 57533,
11
- "<s_birthplace>": 57537,
12
- "<s_bride>": 57529,
13
- "<s_cord-v2>": 57541,
14
- "<s_groom>": 57527,
 
 
 
 
 
 
 
 
15
  "<s_iitcdip>": 57523,
16
- "<s_marital_status>": 57539,
17
- "<s_name>": 57525,
18
- "<s_race>": 57535,
19
- "<s_residence>": 57531,
20
  "<s_synthdog>": 57524,
21
  "<sep/>": 57522
22
  }
 
1
  {
2
+ "</s_Bride Age>": 57538,
3
+ "</s_Bride Birthplace>": 57540,
4
+ "</s_Bride Marital Status>": 57544,
5
+ "</s_Bride Residence>": 57536,
6
+ "</s_Bride name>": 57528,
7
+ "</s_Groom Age>": 57532,
8
+ "</s_Groom Birthplace>": 57534,
9
+ "</s_Groom Marital Status>": 57542,
10
+ "</s_Groom Residence>": 57530,
11
+ "</s_Groom name>": 57526,
12
+ "<s_Bride Age>": 57537,
13
+ "<s_Bride Birthplace>": 57539,
14
+ "<s_Bride Marital Status>": 57543,
15
+ "<s_Bride Residence>": 57535,
16
+ "<s_Bride name>": 57527,
17
+ "<s_Groom Age>": 57531,
18
+ "<s_Groom Birthplace>": 57533,
19
+ "<s_Groom Marital Status>": 57541,
20
+ "<s_Groom Residence>": 57529,
21
+ "<s_Groom name>": 57525,
22
+ "<s_cord-v2>": 57545,
23
  "<s_iitcdip>": 57523,
 
 
 
 
24
  "<s_synthdog>": 57524,
25
  "<sep/>": 57522
26
  }
preprocessor_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
- "size": {
23
- "height": 1200,
24
- "width": 800
25
- }
26
  }
 
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
+ "size": [
23
+ 1200,
24
+ 800
25
+ ]
26
  }
special_tokens_map.json CHANGED
@@ -3,27 +3,9 @@
3
  "<s_iitcdip>",
4
  "<s_synthdog>"
5
  ],
6
- "bos_token": {
7
- "content": "<s>",
8
- "lstrip": false,
9
- "normalized": false,
10
- "rstrip": false,
11
- "single_word": false
12
- },
13
- "cls_token": {
14
- "content": "<s>",
15
- "lstrip": false,
16
- "normalized": false,
17
- "rstrip": false,
18
- "single_word": false
19
- },
20
- "eos_token": {
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": false,
24
- "rstrip": false,
25
- "single_word": false
26
- },
27
  "mask_token": {
28
  "content": "<mask>",
29
  "lstrip": true,
@@ -31,25 +13,7 @@
31
  "rstrip": false,
32
  "single_word": false
33
  },
34
- "pad_token": {
35
- "content": "<pad>",
36
- "lstrip": false,
37
- "normalized": false,
38
- "rstrip": false,
39
- "single_word": false
40
- },
41
- "sep_token": {
42
- "content": "</s>",
43
- "lstrip": false,
44
- "normalized": false,
45
- "rstrip": false,
46
- "single_word": false
47
- },
48
- "unk_token": {
49
- "content": "<unk>",
50
- "lstrip": false,
51
- "normalized": false,
52
- "rstrip": false,
53
- "single_word": false
54
- }
55
  }
 
3
  "<s_iitcdip>",
4
  "<s_synthdog>"
5
  ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9
  "mask_token": {
10
  "content": "<mask>",
11
  "lstrip": true,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "<pad>",
17
+ "sep_token": "</s>",
18
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -65,7 +65,7 @@
65
  "special": true
66
  },
67
  "57525": {
68
- "content": "<s_name>",
69
  "lstrip": false,
70
  "normalized": true,
71
  "rstrip": false,
@@ -73,7 +73,7 @@
73
  "special": false
74
  },
75
  "57526": {
76
- "content": "</s_name>",
77
  "lstrip": false,
78
  "normalized": true,
79
  "rstrip": false,
@@ -81,7 +81,7 @@
81
  "special": false
82
  },
83
  "57527": {
84
- "content": "<s_groom>",
85
  "lstrip": false,
86
  "normalized": true,
87
  "rstrip": false,
@@ -89,7 +89,7 @@
89
  "special": false
90
  },
91
  "57528": {
92
- "content": "</s_groom>",
93
  "lstrip": false,
94
  "normalized": true,
95
  "rstrip": false,
@@ -97,7 +97,7 @@
97
  "special": false
98
  },
99
  "57529": {
100
- "content": "<s_bride>",
101
  "lstrip": false,
102
  "normalized": true,
103
  "rstrip": false,
@@ -105,7 +105,7 @@
105
  "special": false
106
  },
107
  "57530": {
108
- "content": "</s_bride>",
109
  "lstrip": false,
110
  "normalized": true,
111
  "rstrip": false,
@@ -113,7 +113,7 @@
113
  "special": false
114
  },
115
  "57531": {
116
- "content": "<s_residence>",
117
  "lstrip": false,
118
  "normalized": true,
119
  "rstrip": false,
@@ -121,7 +121,7 @@
121
  "special": false
122
  },
123
  "57532": {
124
- "content": "</s_residence>",
125
  "lstrip": false,
126
  "normalized": true,
127
  "rstrip": false,
@@ -129,7 +129,7 @@
129
  "special": false
130
  },
131
  "57533": {
132
- "content": "<s_age>",
133
  "lstrip": false,
134
  "normalized": true,
135
  "rstrip": false,
@@ -137,7 +137,7 @@
137
  "special": false
138
  },
139
  "57534": {
140
- "content": "</s_age>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
@@ -145,7 +145,7 @@
145
  "special": false
146
  },
147
  "57535": {
148
- "content": "<s_race>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
@@ -153,7 +153,7 @@
153
  "special": false
154
  },
155
  "57536": {
156
- "content": "</s_race>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,
@@ -161,7 +161,7 @@
161
  "special": false
162
  },
163
  "57537": {
164
- "content": "<s_birthplace>",
165
  "lstrip": false,
166
  "normalized": true,
167
  "rstrip": false,
@@ -169,7 +169,7 @@
169
  "special": false
170
  },
171
  "57538": {
172
- "content": "</s_birthplace>",
173
  "lstrip": false,
174
  "normalized": true,
175
  "rstrip": false,
@@ -177,7 +177,7 @@
177
  "special": false
178
  },
179
  "57539": {
180
- "content": "<s_marital_status>",
181
  "lstrip": false,
182
  "normalized": true,
183
  "rstrip": false,
@@ -185,7 +185,7 @@
185
  "special": false
186
  },
187
  "57540": {
188
- "content": "</s_marital_status>",
189
  "lstrip": false,
190
  "normalized": true,
191
  "rstrip": false,
@@ -193,6 +193,38 @@
193
  "special": false
194
  },
195
  "57541": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
196
  "content": "<s_cord-v2>",
197
  "lstrip": false,
198
  "normalized": true,
@@ -210,18 +242,11 @@
210
  "cls_token": "<s>",
211
  "eos_token": "</s>",
212
  "mask_token": "<mask>",
213
- "max_length": 768,
214
  "model_max_length": 1000000000000000019884624838656,
215
- "pad_to_multiple_of": null,
216
  "pad_token": "<pad>",
217
- "pad_token_type_id": 0,
218
- "padding_side": "right",
219
  "processor_class": "DonutProcessor",
220
  "sep_token": "</s>",
221
  "sp_model_kwargs": {},
222
- "stride": 0,
223
  "tokenizer_class": "XLMRobertaTokenizer",
224
- "truncation_side": "right",
225
- "truncation_strategy": "longest_first",
226
  "unk_token": "<unk>"
227
  }
 
65
  "special": true
66
  },
67
  "57525": {
68
+ "content": "<s_Groom name>",
69
  "lstrip": false,
70
  "normalized": true,
71
  "rstrip": false,
 
73
  "special": false
74
  },
75
  "57526": {
76
+ "content": "</s_Groom name>",
77
  "lstrip": false,
78
  "normalized": true,
79
  "rstrip": false,
 
81
  "special": false
82
  },
83
  "57527": {
84
+ "content": "<s_Bride name>",
85
  "lstrip": false,
86
  "normalized": true,
87
  "rstrip": false,
 
89
  "special": false
90
  },
91
  "57528": {
92
+ "content": "</s_Bride name>",
93
  "lstrip": false,
94
  "normalized": true,
95
  "rstrip": false,
 
97
  "special": false
98
  },
99
  "57529": {
100
+ "content": "<s_Groom Residence>",
101
  "lstrip": false,
102
  "normalized": true,
103
  "rstrip": false,
 
105
  "special": false
106
  },
107
  "57530": {
108
+ "content": "</s_Groom Residence>",
109
  "lstrip": false,
110
  "normalized": true,
111
  "rstrip": false,
 
113
  "special": false
114
  },
115
  "57531": {
116
+ "content": "<s_Groom Age>",
117
  "lstrip": false,
118
  "normalized": true,
119
  "rstrip": false,
 
121
  "special": false
122
  },
123
  "57532": {
124
+ "content": "</s_Groom Age>",
125
  "lstrip": false,
126
  "normalized": true,
127
  "rstrip": false,
 
129
  "special": false
130
  },
131
  "57533": {
132
+ "content": "<s_Groom Birthplace>",
133
  "lstrip": false,
134
  "normalized": true,
135
  "rstrip": false,
 
137
  "special": false
138
  },
139
  "57534": {
140
+ "content": "</s_Groom Birthplace>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
 
145
  "special": false
146
  },
147
  "57535": {
148
+ "content": "<s_Bride Residence>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
 
153
  "special": false
154
  },
155
  "57536": {
156
+ "content": "</s_Bride Residence>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,
 
161
  "special": false
162
  },
163
  "57537": {
164
+ "content": "<s_Bride Age>",
165
  "lstrip": false,
166
  "normalized": true,
167
  "rstrip": false,
 
169
  "special": false
170
  },
171
  "57538": {
172
+ "content": "</s_Bride Age>",
173
  "lstrip": false,
174
  "normalized": true,
175
  "rstrip": false,
 
177
  "special": false
178
  },
179
  "57539": {
180
+ "content": "<s_Bride Birthplace>",
181
  "lstrip": false,
182
  "normalized": true,
183
  "rstrip": false,
 
185
  "special": false
186
  },
187
  "57540": {
188
+ "content": "</s_Bride Birthplace>",
189
  "lstrip": false,
190
  "normalized": true,
191
  "rstrip": false,
 
193
  "special": false
194
  },
195
  "57541": {
196
+ "content": "<s_Groom Marital Status>",
197
+ "lstrip": false,
198
+ "normalized": true,
199
+ "rstrip": false,
200
+ "single_word": false,
201
+ "special": false
202
+ },
203
+ "57542": {
204
+ "content": "</s_Groom Marital Status>",
205
+ "lstrip": false,
206
+ "normalized": true,
207
+ "rstrip": false,
208
+ "single_word": false,
209
+ "special": false
210
+ },
211
+ "57543": {
212
+ "content": "<s_Bride Marital Status>",
213
+ "lstrip": false,
214
+ "normalized": true,
215
+ "rstrip": false,
216
+ "single_word": false,
217
+ "special": false
218
+ },
219
+ "57544": {
220
+ "content": "</s_Bride Marital Status>",
221
+ "lstrip": false,
222
+ "normalized": true,
223
+ "rstrip": false,
224
+ "single_word": false,
225
+ "special": false
226
+ },
227
+ "57545": {
228
  "content": "<s_cord-v2>",
229
  "lstrip": false,
230
  "normalized": true,
 
242
  "cls_token": "<s>",
243
  "eos_token": "</s>",
244
  "mask_token": "<mask>",
 
245
  "model_max_length": 1000000000000000019884624838656,
 
246
  "pad_token": "<pad>",
 
 
247
  "processor_class": "DonutProcessor",
248
  "sep_token": "</s>",
249
  "sp_model_kwargs": {},
 
250
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
251
  "unk_token": "<unk>"
252
  }