sreejith8100 committed on
Commit
2592635
1 Parent(s): e9f159b

End of training

Browse files
README.md CHANGED
@@ -35,7 +35,7 @@ More information needed
35
 
36
  The following hyperparameters were used during training:
37
  - learning_rate: 2e-05
38
- - train_batch_size: 2
39
  - eval_batch_size: 8
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 
35
 
36
  The following hyperparameters were used during training:
37
  - learning_rate: 2e-05
38
+ - train_batch_size: 1
39
  - eval_batch_size: 8
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
added_tokens.json CHANGED
@@ -1,26 +1,20 @@
1
  {
2
  "</s>": 2,
3
- "</s_address>": 57530,
4
- "</s_father_name>": 57537,
5
- "</s_first_name>": 57534,
6
- "</s_last_name>": 57539,
7
- "</s_mother_name>": 57531,
8
- "</s_place_of_birth>": 57540,
9
- "</s_random_number>": 57532,
10
- "</s_title>": 57536,
11
  "<mask>": 57521,
12
  "<pad>": 1,
13
  "<s>": 0,
14
- "<s_address>": 57538,
15
- "<s_father_name>": 57526,
16
- "<s_first_name>": 57527,
17
  "<s_iitcdip>": 57523,
18
- "<s_last_name>": 57535,
19
- "<s_mother_name>": 57525,
20
- "<s_place_of_birth>": 57529,
21
- "<s_random_number>": 57528,
22
  "<s_synthdog>": 57524,
23
- "<s_title>": 57533,
24
  "<sep/>": 57522,
25
  "<unk>": 3
26
  }
 
1
  {
2
  "</s>": 2,
3
+ "</s_First>": 57529,
4
+ "</s_Last>": 57531,
5
+ "</s_Middle>": 57534,
6
+ "</s_no>": 57528,
7
+ "</s_province>": 57532,
 
 
 
8
  "<mask>": 57521,
9
  "<pad>": 1,
10
  "<s>": 0,
11
+ "<s_First>": 57527,
12
+ "<s_Last>": 57530,
13
+ "<s_Middle>": 57533,
14
  "<s_iitcdip>": 57523,
15
+ "<s_no>": 57526,
16
+ "<s_province>": 57525,
 
 
17
  "<s_synthdog>": 57524,
 
18
  "<sep/>": 57522,
19
  "<unk>": 3
20
  }
preprocessor_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
- 512,
24
- 512
25
  ]
26
  }
 
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
+ 800,
24
+ 1200
25
  ]
26
  }
special_tokens_map.json CHANGED
@@ -2,24 +2,18 @@
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
5
- "<s_mother_name>",
6
- "<s_father_name>",
7
- "<s_first_name>",
8
  "</s>",
9
- "<s_random_number>",
10
- "<s_place_of_birth>",
11
- "</s_address>",
12
- "</s_mother_name>",
13
- "</s_random_number>",
14
- "<s_title>",
15
- "</s_first_name>",
16
- "<s_last_name>",
17
- "</s_title>",
18
- "</s_father_name>",
19
- "<s_address>",
20
  "<s>",
21
- "</s_last_name>",
22
- "</s_place_of_birth>"
23
  ],
24
  "bos_token": "<s>",
25
  "cls_token": "<s>",
 
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
 
 
 
5
  "</s>",
6
+ "<s_province>",
7
+ "<s_no>",
8
+ "<s_First>",
9
+ "</s_no>",
10
+ "</s_First>",
11
+ "<s_Last>",
12
+ "</s_Last>",
13
+ "</s_province>",
14
+ "<s_Middle>",
 
 
15
  "<s>",
16
+ "</s_Middle>"
 
17
  ],
18
  "bos_token": "<s>",
19
  "cls_token": "<s>",
tokenizer.json CHANGED
@@ -91,7 +91,7 @@
91
  },
92
  {
93
  "id": 57525,
94
- "content": "<s_mother_name>",
95
  "single_word": false,
96
  "lstrip": true,
97
  "rstrip": true,
@@ -100,7 +100,7 @@
100
  },
101
  {
102
  "id": 57526,
103
- "content": "<s_father_name>",
104
  "single_word": false,
105
  "lstrip": true,
106
  "rstrip": true,
@@ -109,7 +109,7 @@
109
  },
110
  {
111
  "id": 57527,
112
- "content": "<s_first_name>",
113
  "single_word": false,
114
  "lstrip": true,
115
  "rstrip": true,
@@ -118,7 +118,7 @@
118
  },
119
  {
120
  "id": 57528,
121
- "content": "<s_random_number>",
122
  "single_word": false,
123
  "lstrip": true,
124
  "rstrip": true,
@@ -127,7 +127,7 @@
127
  },
128
  {
129
  "id": 57529,
130
- "content": "<s_place_of_birth>",
131
  "single_word": false,
132
  "lstrip": true,
133
  "rstrip": true,
@@ -136,7 +136,7 @@
136
  },
137
  {
138
  "id": 57530,
139
- "content": "</s_address>",
140
  "single_word": false,
141
  "lstrip": true,
142
  "rstrip": true,
@@ -145,7 +145,7 @@
145
  },
146
  {
147
  "id": 57531,
148
- "content": "</s_mother_name>",
149
  "single_word": false,
150
  "lstrip": true,
151
  "rstrip": true,
@@ -154,7 +154,7 @@
154
  },
155
  {
156
  "id": 57532,
157
- "content": "</s_random_number>",
158
  "single_word": false,
159
  "lstrip": true,
160
  "rstrip": true,
@@ -163,7 +163,7 @@
163
  },
164
  {
165
  "id": 57533,
166
- "content": "<s_title>",
167
  "single_word": false,
168
  "lstrip": true,
169
  "rstrip": true,
@@ -172,61 +172,7 @@
172
  },
173
  {
174
  "id": 57534,
175
- "content": "</s_first_name>",
176
- "single_word": false,
177
- "lstrip": true,
178
- "rstrip": true,
179
- "normalized": false,
180
- "special": true
181
- },
182
- {
183
- "id": 57535,
184
- "content": "<s_last_name>",
185
- "single_word": false,
186
- "lstrip": true,
187
- "rstrip": true,
188
- "normalized": false,
189
- "special": true
190
- },
191
- {
192
- "id": 57536,
193
- "content": "</s_title>",
194
- "single_word": false,
195
- "lstrip": true,
196
- "rstrip": true,
197
- "normalized": false,
198
- "special": true
199
- },
200
- {
201
- "id": 57537,
202
- "content": "</s_father_name>",
203
- "single_word": false,
204
- "lstrip": true,
205
- "rstrip": true,
206
- "normalized": false,
207
- "special": true
208
- },
209
- {
210
- "id": 57538,
211
- "content": "<s_address>",
212
- "single_word": false,
213
- "lstrip": true,
214
- "rstrip": true,
215
- "normalized": false,
216
- "special": true
217
- },
218
- {
219
- "id": 57539,
220
- "content": "</s_last_name>",
221
- "single_word": false,
222
- "lstrip": true,
223
- "rstrip": true,
224
- "normalized": false,
225
- "special": true
226
- },
227
- {
228
- "id": 57540,
229
- "content": "</s_place_of_birth>",
230
  "single_word": false,
231
  "lstrip": true,
232
  "rstrip": true,
 
91
  },
92
  {
93
  "id": 57525,
94
+ "content": "<s_province>",
95
  "single_word": false,
96
  "lstrip": true,
97
  "rstrip": true,
 
100
  },
101
  {
102
  "id": 57526,
103
+ "content": "<s_no>",
104
  "single_word": false,
105
  "lstrip": true,
106
  "rstrip": true,
 
109
  },
110
  {
111
  "id": 57527,
112
+ "content": "<s_First>",
113
  "single_word": false,
114
  "lstrip": true,
115
  "rstrip": true,
 
118
  },
119
  {
120
  "id": 57528,
121
+ "content": "</s_no>",
122
  "single_word": false,
123
  "lstrip": true,
124
  "rstrip": true,
 
127
  },
128
  {
129
  "id": 57529,
130
+ "content": "</s_First>",
131
  "single_word": false,
132
  "lstrip": true,
133
  "rstrip": true,
 
136
  },
137
  {
138
  "id": 57530,
139
+ "content": "<s_Last>",
140
  "single_word": false,
141
  "lstrip": true,
142
  "rstrip": true,
 
145
  },
146
  {
147
  "id": 57531,
148
+ "content": "</s_Last>",
149
  "single_word": false,
150
  "lstrip": true,
151
  "rstrip": true,
 
154
  },
155
  {
156
  "id": 57532,
157
+ "content": "</s_province>",
158
  "single_word": false,
159
  "lstrip": true,
160
  "rstrip": true,
 
163
  },
164
  {
165
  "id": 57533,
166
+ "content": "<s_Middle>",
167
  "single_word": false,
168
  "lstrip": true,
169
  "rstrip": true,
 
172
  },
173
  {
174
  "id": 57534,
175
+ "content": "</s_Middle>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
176
  "single_word": false,
177
  "lstrip": true,
178
  "rstrip": true,
tokenizer_config.json CHANGED
@@ -65,7 +65,7 @@
65
  "special": true
66
  },
67
  "57525": {
68
- "content": "<s_mother_name>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
@@ -73,7 +73,7 @@
73
  "special": true
74
  },
75
  "57526": {
76
- "content": "<s_father_name>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
@@ -81,7 +81,7 @@
81
  "special": true
82
  },
83
  "57527": {
84
- "content": "<s_first_name>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
@@ -89,7 +89,7 @@
89
  "special": true
90
  },
91
  "57528": {
92
- "content": "<s_random_number>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
@@ -97,7 +97,7 @@
97
  "special": true
98
  },
99
  "57529": {
100
- "content": "<s_place_of_birth>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
@@ -105,7 +105,7 @@
105
  "special": true
106
  },
107
  "57530": {
108
- "content": "</s_address>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
@@ -113,7 +113,7 @@
113
  "special": true
114
  },
115
  "57531": {
116
- "content": "</s_mother_name>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
@@ -121,7 +121,7 @@
121
  "special": true
122
  },
123
  "57532": {
124
- "content": "</s_random_number>",
125
  "lstrip": true,
126
  "normalized": false,
127
  "rstrip": true,
@@ -129,7 +129,7 @@
129
  "special": true
130
  },
131
  "57533": {
132
- "content": "<s_title>",
133
  "lstrip": true,
134
  "normalized": false,
135
  "rstrip": true,
@@ -137,55 +137,7 @@
137
  "special": true
138
  },
139
  "57534": {
140
- "content": "</s_first_name>",
141
- "lstrip": true,
142
- "normalized": false,
143
- "rstrip": true,
144
- "single_word": false,
145
- "special": true
146
- },
147
- "57535": {
148
- "content": "<s_last_name>",
149
- "lstrip": true,
150
- "normalized": false,
151
- "rstrip": true,
152
- "single_word": false,
153
- "special": true
154
- },
155
- "57536": {
156
- "content": "</s_title>",
157
- "lstrip": true,
158
- "normalized": false,
159
- "rstrip": true,
160
- "single_word": false,
161
- "special": true
162
- },
163
- "57537": {
164
- "content": "</s_father_name>",
165
- "lstrip": true,
166
- "normalized": false,
167
- "rstrip": true,
168
- "single_word": false,
169
- "special": true
170
- },
171
- "57538": {
172
- "content": "<s_address>",
173
- "lstrip": true,
174
- "normalized": false,
175
- "rstrip": true,
176
- "single_word": false,
177
- "special": true
178
- },
179
- "57539": {
180
- "content": "</s_last_name>",
181
- "lstrip": true,
182
- "normalized": false,
183
- "rstrip": true,
184
- "single_word": false,
185
- "special": true
186
- },
187
- "57540": {
188
- "content": "</s_place_of_birth>",
189
  "lstrip": true,
190
  "normalized": false,
191
  "rstrip": true,
@@ -196,24 +148,18 @@
196
  "additional_special_tokens": [
197
  "<s_iitcdip>",
198
  "<s_synthdog>",
199
- "<s_mother_name>",
200
- "<s_father_name>",
201
- "<s_first_name>",
202
  "</s>",
203
- "<s_random_number>",
204
- "<s_place_of_birth>",
205
- "</s_address>",
206
- "</s_mother_name>",
207
- "</s_random_number>",
208
- "<s_title>",
209
- "</s_first_name>",
210
- "<s_last_name>",
211
- "</s_title>",
212
- "</s_father_name>",
213
- "<s_address>",
214
  "<s>",
215
- "</s_last_name>",
216
- "</s_place_of_birth>"
217
  ],
218
  "bos_token": "<s>",
219
  "clean_up_tokenization_spaces": true,
 
65
  "special": true
66
  },
67
  "57525": {
68
+ "content": "<s_province>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
 
73
  "special": true
74
  },
75
  "57526": {
76
+ "content": "<s_no>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
 
81
  "special": true
82
  },
83
  "57527": {
84
+ "content": "<s_First>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
 
89
  "special": true
90
  },
91
  "57528": {
92
+ "content": "</s_no>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
 
97
  "special": true
98
  },
99
  "57529": {
100
+ "content": "</s_First>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
 
105
  "special": true
106
  },
107
  "57530": {
108
+ "content": "<s_Last>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
 
113
  "special": true
114
  },
115
  "57531": {
116
+ "content": "</s_Last>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
 
121
  "special": true
122
  },
123
  "57532": {
124
+ "content": "</s_province>",
125
  "lstrip": true,
126
  "normalized": false,
127
  "rstrip": true,
 
129
  "special": true
130
  },
131
  "57533": {
132
+ "content": "<s_Middle>",
133
  "lstrip": true,
134
  "normalized": false,
135
  "rstrip": true,
 
137
  "special": true
138
  },
139
  "57534": {
140
+ "content": "</s_Middle>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
141
  "lstrip": true,
142
  "normalized": false,
143
  "rstrip": true,
 
148
  "additional_special_tokens": [
149
  "<s_iitcdip>",
150
  "<s_synthdog>",
 
 
 
151
  "</s>",
152
+ "<s_province>",
153
+ "<s_no>",
154
+ "<s_First>",
155
+ "</s_no>",
156
+ "</s_First>",
157
+ "<s_Last>",
158
+ "</s_Last>",
159
+ "</s_province>",
160
+ "<s_Middle>",
 
 
161
  "<s>",
162
+ "</s_Middle>"
 
163
  ],
164
  "bos_token": "<s>",
165
  "clean_up_tokenization_spaces": true,