sreejith8100 committed on
Commit
5f524f1
1 Parent(s): 9d352b0

End of training

Browse files
README.md CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 1
44
 
45
  ### Training results
46
 
 
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
+ - num_epochs: 6
44
 
45
  ### Training results
46
 
added_tokens.json CHANGED
@@ -1,18 +1,26 @@
1
  {
2
  "</s>": 2,
3
- "</s_address>": 57527,
4
- "</s_company>": 57529,
5
- "</s_date>": 57526,
6
- "</s_total>": 57528,
 
 
 
 
7
  "<mask>": 57521,
8
  "<pad>": 1,
9
  "<s>": 0,
10
- "<s_address>": 57530,
11
- "<s_company>": 57532,
12
- "<s_date>": 57525,
13
  "<s_iitcdip>": 57523,
 
 
 
 
14
  "<s_synthdog>": 57524,
15
- "<s_total>": 57531,
16
  "<sep/>": 57522,
17
  "<unk>": 3
18
  }
 
1
  {
2
  "</s>": 2,
3
+ "</s_address>": 57530,
4
+ "</s_father_name>": 57537,
5
+ "</s_first_name>": 57534,
6
+ "</s_last_name>": 57539,
7
+ "</s_mother_name>": 57531,
8
+ "</s_place_of_birth>": 57540,
9
+ "</s_random_number>": 57532,
10
+ "</s_title>": 57536,
11
  "<mask>": 57521,
12
  "<pad>": 1,
13
  "<s>": 0,
14
+ "<s_address>": 57538,
15
+ "<s_father_name>": 57526,
16
+ "<s_first_name>": 57527,
17
  "<s_iitcdip>": 57523,
18
+ "<s_last_name>": 57535,
19
+ "<s_mother_name>": 57525,
20
+ "<s_place_of_birth>": 57529,
21
+ "<s_random_number>": 57528,
22
  "<s_synthdog>": 57524,
23
+ "<s_title>": 57533,
24
  "<sep/>": 57522,
25
  "<unk>": 3
26
  }
preprocessor_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
- 720,
24
- 960
25
  ]
26
  }
 
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
+ 512,
24
+ 512
25
  ]
26
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ec5337ee2c229f65606bc0d106fb3ce1a1b9b20189b21e038d3268b0e70fce5
3
  size 809244441
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ac39cd5487d60cc7c781796714e6e496fa1b80beaf0c862789bace2dff351a0
3
  size 809244441
special_tokens_map.json CHANGED
@@ -2,16 +2,24 @@
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
5
- "<s_date>",
 
 
6
  "</s>",
7
- "</s_date>",
 
8
  "</s_address>",
9
- "</s_total>",
10
- "</s_company>",
 
 
 
 
 
11
  "<s_address>",
12
  "<s>",
13
- "<s_total>",
14
- "<s_company>"
15
  ],
16
  "bos_token": "<s>",
17
  "cls_token": "<s>",
 
2
  "additional_special_tokens": [
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
5
+ "<s_mother_name>",
6
+ "<s_father_name>",
7
+ "<s_first_name>",
8
  "</s>",
9
+ "<s_random_number>",
10
+ "<s_place_of_birth>",
11
  "</s_address>",
12
+ "</s_mother_name>",
13
+ "</s_random_number>",
14
+ "<s_title>",
15
+ "</s_first_name>",
16
+ "<s_last_name>",
17
+ "</s_title>",
18
+ "</s_father_name>",
19
  "<s_address>",
20
  "<s>",
21
+ "</s_last_name>",
22
+ "</s_place_of_birth>"
23
  ],
24
  "bos_token": "<s>",
25
  "cls_token": "<s>",
tokenizer.json CHANGED
@@ -91,7 +91,7 @@
91
  },
92
  {
93
  "id": 57525,
94
- "content": "<s_date>",
95
  "single_word": false,
96
  "lstrip": true,
97
  "rstrip": true,
@@ -100,7 +100,7 @@
100
  },
101
  {
102
  "id": 57526,
103
- "content": "</s_date>",
104
  "single_word": false,
105
  "lstrip": true,
106
  "rstrip": true,
@@ -109,7 +109,7 @@
109
  },
110
  {
111
  "id": 57527,
112
- "content": "</s_address>",
113
  "single_word": false,
114
  "lstrip": true,
115
  "rstrip": true,
@@ -118,7 +118,7 @@
118
  },
119
  {
120
  "id": 57528,
121
- "content": "</s_total>",
122
  "single_word": false,
123
  "lstrip": true,
124
  "rstrip": true,
@@ -127,7 +127,7 @@
127
  },
128
  {
129
  "id": 57529,
130
- "content": "</s_company>",
131
  "single_word": false,
132
  "lstrip": true,
133
  "rstrip": true,
@@ -136,7 +136,7 @@
136
  },
137
  {
138
  "id": 57530,
139
- "content": "<s_address>",
140
  "single_word": false,
141
  "lstrip": true,
142
  "rstrip": true,
@@ -145,7 +145,7 @@
145
  },
146
  {
147
  "id": 57531,
148
- "content": "<s_total>",
149
  "single_word": false,
150
  "lstrip": true,
151
  "rstrip": true,
@@ -154,7 +154,79 @@
154
  },
155
  {
156
  "id": 57532,
157
- "content": "<s_company>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
158
  "single_word": false,
159
  "lstrip": true,
160
  "rstrip": true,
 
91
  },
92
  {
93
  "id": 57525,
94
+ "content": "<s_mother_name>",
95
  "single_word": false,
96
  "lstrip": true,
97
  "rstrip": true,
 
100
  },
101
  {
102
  "id": 57526,
103
+ "content": "<s_father_name>",
104
  "single_word": false,
105
  "lstrip": true,
106
  "rstrip": true,
 
109
  },
110
  {
111
  "id": 57527,
112
+ "content": "<s_first_name>",
113
  "single_word": false,
114
  "lstrip": true,
115
  "rstrip": true,
 
118
  },
119
  {
120
  "id": 57528,
121
+ "content": "<s_random_number>",
122
  "single_word": false,
123
  "lstrip": true,
124
  "rstrip": true,
 
127
  },
128
  {
129
  "id": 57529,
130
+ "content": "<s_place_of_birth>",
131
  "single_word": false,
132
  "lstrip": true,
133
  "rstrip": true,
 
136
  },
137
  {
138
  "id": 57530,
139
+ "content": "</s_address>",
140
  "single_word": false,
141
  "lstrip": true,
142
  "rstrip": true,
 
145
  },
146
  {
147
  "id": 57531,
148
+ "content": "</s_mother_name>",
149
  "single_word": false,
150
  "lstrip": true,
151
  "rstrip": true,
 
154
  },
155
  {
156
  "id": 57532,
157
+ "content": "</s_random_number>",
158
+ "single_word": false,
159
+ "lstrip": true,
160
+ "rstrip": true,
161
+ "normalized": false,
162
+ "special": true
163
+ },
164
+ {
165
+ "id": 57533,
166
+ "content": "<s_title>",
167
+ "single_word": false,
168
+ "lstrip": true,
169
+ "rstrip": true,
170
+ "normalized": false,
171
+ "special": true
172
+ },
173
+ {
174
+ "id": 57534,
175
+ "content": "</s_first_name>",
176
+ "single_word": false,
177
+ "lstrip": true,
178
+ "rstrip": true,
179
+ "normalized": false,
180
+ "special": true
181
+ },
182
+ {
183
+ "id": 57535,
184
+ "content": "<s_last_name>",
185
+ "single_word": false,
186
+ "lstrip": true,
187
+ "rstrip": true,
188
+ "normalized": false,
189
+ "special": true
190
+ },
191
+ {
192
+ "id": 57536,
193
+ "content": "</s_title>",
194
+ "single_word": false,
195
+ "lstrip": true,
196
+ "rstrip": true,
197
+ "normalized": false,
198
+ "special": true
199
+ },
200
+ {
201
+ "id": 57537,
202
+ "content": "</s_father_name>",
203
+ "single_word": false,
204
+ "lstrip": true,
205
+ "rstrip": true,
206
+ "normalized": false,
207
+ "special": true
208
+ },
209
+ {
210
+ "id": 57538,
211
+ "content": "<s_address>",
212
+ "single_word": false,
213
+ "lstrip": true,
214
+ "rstrip": true,
215
+ "normalized": false,
216
+ "special": true
217
+ },
218
+ {
219
+ "id": 57539,
220
+ "content": "</s_last_name>",
221
+ "single_word": false,
222
+ "lstrip": true,
223
+ "rstrip": true,
224
+ "normalized": false,
225
+ "special": true
226
+ },
227
+ {
228
+ "id": 57540,
229
+ "content": "</s_place_of_birth>",
230
  "single_word": false,
231
  "lstrip": true,
232
  "rstrip": true,
tokenizer_config.json CHANGED
@@ -65,7 +65,7 @@
65
  "special": true
66
  },
67
  "57525": {
68
- "content": "<s_date>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
@@ -73,7 +73,7 @@
73
  "special": true
74
  },
75
  "57526": {
76
- "content": "</s_date>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
@@ -81,7 +81,7 @@
81
  "special": true
82
  },
83
  "57527": {
84
- "content": "</s_address>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
@@ -89,7 +89,7 @@
89
  "special": true
90
  },
91
  "57528": {
92
- "content": "</s_total>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
@@ -97,7 +97,7 @@
97
  "special": true
98
  },
99
  "57529": {
100
- "content": "</s_company>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
@@ -105,7 +105,7 @@
105
  "special": true
106
  },
107
  "57530": {
108
- "content": "<s_address>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
@@ -113,7 +113,7 @@
113
  "special": true
114
  },
115
  "57531": {
116
- "content": "<s_total>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
@@ -121,7 +121,71 @@
121
  "special": true
122
  },
123
  "57532": {
124
- "content": "<s_company>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
125
  "lstrip": true,
126
  "normalized": false,
127
  "rstrip": true,
@@ -132,16 +196,24 @@
132
  "additional_special_tokens": [
133
  "<s_iitcdip>",
134
  "<s_synthdog>",
135
- "<s_date>",
 
 
136
  "</s>",
137
- "</s_date>",
 
138
  "</s_address>",
139
- "</s_total>",
140
- "</s_company>",
 
 
 
 
 
141
  "<s_address>",
142
  "<s>",
143
- "<s_total>",
144
- "<s_company>"
145
  ],
146
  "bos_token": "<s>",
147
  "clean_up_tokenization_spaces": true,
 
65
  "special": true
66
  },
67
  "57525": {
68
+ "content": "<s_mother_name>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
 
73
  "special": true
74
  },
75
  "57526": {
76
+ "content": "<s_father_name>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
 
81
  "special": true
82
  },
83
  "57527": {
84
+ "content": "<s_first_name>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
 
89
  "special": true
90
  },
91
  "57528": {
92
+ "content": "<s_random_number>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
 
97
  "special": true
98
  },
99
  "57529": {
100
+ "content": "<s_place_of_birth>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
 
105
  "special": true
106
  },
107
  "57530": {
108
+ "content": "</s_address>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
 
113
  "special": true
114
  },
115
  "57531": {
116
+ "content": "</s_mother_name>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
 
121
  "special": true
122
  },
123
  "57532": {
124
+ "content": "</s_random_number>",
125
+ "lstrip": true,
126
+ "normalized": false,
127
+ "rstrip": true,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "57533": {
132
+ "content": "<s_title>",
133
+ "lstrip": true,
134
+ "normalized": false,
135
+ "rstrip": true,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "57534": {
140
+ "content": "</s_first_name>",
141
+ "lstrip": true,
142
+ "normalized": false,
143
+ "rstrip": true,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "57535": {
148
+ "content": "<s_last_name>",
149
+ "lstrip": true,
150
+ "normalized": false,
151
+ "rstrip": true,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "57536": {
156
+ "content": "</s_title>",
157
+ "lstrip": true,
158
+ "normalized": false,
159
+ "rstrip": true,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "57537": {
164
+ "content": "</s_father_name>",
165
+ "lstrip": true,
166
+ "normalized": false,
167
+ "rstrip": true,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "57538": {
172
+ "content": "<s_address>",
173
+ "lstrip": true,
174
+ "normalized": false,
175
+ "rstrip": true,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "57539": {
180
+ "content": "</s_last_name>",
181
+ "lstrip": true,
182
+ "normalized": false,
183
+ "rstrip": true,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "57540": {
188
+ "content": "</s_place_of_birth>",
189
  "lstrip": true,
190
  "normalized": false,
191
  "rstrip": true,
 
196
  "additional_special_tokens": [
197
  "<s_iitcdip>",
198
  "<s_synthdog>",
199
+ "<s_mother_name>",
200
+ "<s_father_name>",
201
+ "<s_first_name>",
202
  "</s>",
203
+ "<s_random_number>",
204
+ "<s_place_of_birth>",
205
  "</s_address>",
206
+ "</s_mother_name>",
207
+ "</s_random_number>",
208
+ "<s_title>",
209
+ "</s_first_name>",
210
+ "<s_last_name>",
211
+ "</s_title>",
212
+ "</s_father_name>",
213
  "<s_address>",
214
  "<s>",
215
+ "</s_last_name>",
216
+ "</s_place_of_birth>"
217
  ],
218
  "bos_token": "<s>",
219
  "clean_up_tokenization_spaces": true,