amberschuh committed on
Commit
8d0599b
1 Parent(s): b0a02f0

End of training

Browse files
added_tokens.json CHANGED
@@ -1,13 +1,5 @@
1
  {
2
- "</s_address>": 57527,
3
- "</s_company>": 57529,
4
- "</s_date>": 57526,
5
- "</s_total>": 57528,
6
- "<s_address>": 57530,
7
- "<s_company>": 57532,
8
- "<s_date>": 57525,
9
  "<s_iitcdip>": 57523,
10
  "<s_synthdog>": 57524,
11
- "<s_total>": 57531,
12
  "<sep/>": 57522
13
  }
 
1
  {
 
 
 
 
 
 
 
2
  "<s_iitcdip>": 57523,
3
  "<s_synthdog>": 57524,
 
4
  "<sep/>": 57522
5
  }
special_tokens_map.json CHANGED
@@ -1,12 +1,5 @@
1
  {
2
  "additional_special_tokens": [
3
- {
4
- "content": "<s_date>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- },
10
  {
11
  "content": "</s>",
12
  "lstrip": false,
@@ -14,61 +7,12 @@
14
  "rstrip": false,
15
  "single_word": false
16
  },
17
- {
18
- "content": "</s_date>",
19
- "lstrip": false,
20
- "normalized": false,
21
- "rstrip": false,
22
- "single_word": false
23
- },
24
- {
25
- "content": "</s_address>",
26
- "lstrip": false,
27
- "normalized": false,
28
- "rstrip": false,
29
- "single_word": false
30
- },
31
- {
32
- "content": "</s_total>",
33
- "lstrip": false,
34
- "normalized": false,
35
- "rstrip": false,
36
- "single_word": false
37
- },
38
- {
39
- "content": "</s_company>",
40
- "lstrip": false,
41
- "normalized": false,
42
- "rstrip": false,
43
- "single_word": false
44
- },
45
- {
46
- "content": "<s_address>",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false
51
- },
52
  {
53
  "content": "<s>",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false
58
- },
59
- {
60
- "content": "<s_total>",
61
- "lstrip": false,
62
- "normalized": false,
63
- "rstrip": false,
64
- "single_word": false
65
- },
66
- {
67
- "content": "<s_company>",
68
- "lstrip": false,
69
- "normalized": false,
70
- "rstrip": false,
71
- "single_word": false
72
  }
73
  ],
74
  "bos_token": "<s>",
 
1
  {
2
  "additional_special_tokens": [
 
 
 
 
 
 
 
3
  {
4
  "content": "</s>",
5
  "lstrip": false,
 
7
  "rstrip": false,
8
  "single_word": false
9
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  {
11
  "content": "<s>",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
15
  "single_word": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  }
17
  ],
18
  "bos_token": "<s>",
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 512
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 1,
16
- "pad_type_id": 0,
17
- "pad_token": "<pad>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
@@ -88,78 +74,6 @@
88
  "rstrip": false,
89
  "normalized": false,
90
  "special": true
91
- },
92
- {
93
- "id": 57525,
94
- "content": "<s_date>",
95
- "single_word": false,
96
- "lstrip": false,
97
- "rstrip": false,
98
- "normalized": false,
99
- "special": true
100
- },
101
- {
102
- "id": 57526,
103
- "content": "</s_date>",
104
- "single_word": false,
105
- "lstrip": false,
106
- "rstrip": false,
107
- "normalized": false,
108
- "special": true
109
- },
110
- {
111
- "id": 57527,
112
- "content": "</s_address>",
113
- "single_word": false,
114
- "lstrip": false,
115
- "rstrip": false,
116
- "normalized": false,
117
- "special": true
118
- },
119
- {
120
- "id": 57528,
121
- "content": "</s_total>",
122
- "single_word": false,
123
- "lstrip": false,
124
- "rstrip": false,
125
- "normalized": false,
126
- "special": true
127
- },
128
- {
129
- "id": 57529,
130
- "content": "</s_company>",
131
- "single_word": false,
132
- "lstrip": false,
133
- "rstrip": false,
134
- "normalized": false,
135
- "special": true
136
- },
137
- {
138
- "id": 57530,
139
- "content": "<s_address>",
140
- "single_word": false,
141
- "lstrip": false,
142
- "rstrip": false,
143
- "normalized": false,
144
- "special": true
145
- },
146
- {
147
- "id": 57531,
148
- "content": "<s_total>",
149
- "single_word": false,
150
- "lstrip": false,
151
- "rstrip": false,
152
- "normalized": false,
153
- "special": true
154
- },
155
- {
156
- "id": 57532,
157
- "content": "<s_company>",
158
- "single_word": false,
159
- "lstrip": false,
160
- "rstrip": false,
161
- "normalized": false,
162
- "special": true
163
  }
164
  ],
165
  "normalizer": {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
74
  "rstrip": false,
75
  "normalized": false,
76
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
77
  }
78
  ],
79
  "normalizer": {
tokenizer_config.json CHANGED
@@ -63,83 +63,11 @@
63
  "rstrip": false,
64
  "single_word": false,
65
  "special": true
66
- },
67
- "57525": {
68
- "content": "<s_date>",
69
- "lstrip": false,
70
- "normalized": false,
71
- "rstrip": false,
72
- "single_word": false,
73
- "special": true
74
- },
75
- "57526": {
76
- "content": "</s_date>",
77
- "lstrip": false,
78
- "normalized": false,
79
- "rstrip": false,
80
- "single_word": false,
81
- "special": true
82
- },
83
- "57527": {
84
- "content": "</s_address>",
85
- "lstrip": false,
86
- "normalized": false,
87
- "rstrip": false,
88
- "single_word": false,
89
- "special": true
90
- },
91
- "57528": {
92
- "content": "</s_total>",
93
- "lstrip": false,
94
- "normalized": false,
95
- "rstrip": false,
96
- "single_word": false,
97
- "special": true
98
- },
99
- "57529": {
100
- "content": "</s_company>",
101
- "lstrip": false,
102
- "normalized": false,
103
- "rstrip": false,
104
- "single_word": false,
105
- "special": true
106
- },
107
- "57530": {
108
- "content": "<s_address>",
109
- "lstrip": false,
110
- "normalized": false,
111
- "rstrip": false,
112
- "single_word": false,
113
- "special": true
114
- },
115
- "57531": {
116
- "content": "<s_total>",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false,
121
- "special": true
122
- },
123
- "57532": {
124
- "content": "<s_company>",
125
- "lstrip": false,
126
- "normalized": false,
127
- "rstrip": false,
128
- "single_word": false,
129
- "special": true
130
  }
131
  },
132
  "additional_special_tokens": [
133
- "<s_date>",
134
  "</s>",
135
- "</s_date>",
136
- "</s_address>",
137
- "</s_total>",
138
- "</s_company>",
139
- "<s_address>",
140
- "<s>",
141
- "<s_total>",
142
- "<s_company>"
143
  ],
144
  "bos_token": "<s>",
145
  "clean_up_tokenization_spaces": true,
 
63
  "rstrip": false,
64
  "single_word": false,
65
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
66
  }
67
  },
68
  "additional_special_tokens": [
 
69
  "</s>",
70
+ "<s>"
 
 
 
 
 
 
 
71
  ],
72
  "bos_token": "<s>",
73
  "clean_up_tokenization_spaces": true,