KoichiYasuoka committed on
Commit
991ef8f
1 Parent(s): 54e41fa

model improved

Browse files
config.json CHANGED
@@ -14,102 +14,97 @@
14
  "2": "ADP",
15
  "3": "ADV",
16
  "4": "AUX",
17
- "5": "AUX|Polarity=Neg",
18
- "6": "AUX|Polarity=Neg+VERB",
19
- "7": "B-ADJ",
20
- "8": "B-ADJ+ADJ",
21
- "9": "B-ADJ+AUX+AUX",
22
- "10": "B-ADJ+VERB",
23
- "11": "B-ADP",
24
- "12": "B-ADP+NOUN",
25
- "13": "B-ADV",
26
- "14": "B-ADV+ADP",
27
- "15": "B-ADV+ADP+VERB",
28
- "16": "B-AUX",
29
- "17": "B-AUX+AUX",
30
- "18": "B-AUX+AUX+AUX",
31
- "19": "B-AUX+AUX+PART",
32
  "20": "B-AUX+SCONJ",
33
- "21": "B-AUX|Polarity=Neg",
34
- "22": "B-AUX|Polarity=Neg+VERB",
35
- "23": "B-CCONJ",
36
- "24": "B-DET",
37
- "25": "B-INTJ",
38
- "26": "B-NOUN",
39
- "27": "B-NOUN+ADJ",
40
- "28": "B-NOUN+ADP",
41
- "29": "B-NOUN|Polarity=Neg",
42
- "30": "B-NUM",
43
- "31": "B-PART",
44
- "32": "B-PRON",
45
- "33": "B-PROPN",
46
- "34": "B-PUNCT",
47
- "35": "B-SCONJ",
48
- "36": "B-SYM",
49
- "37": "B-VERB",
50
- "38": "B-VERB+AUX",
51
- "39": "B-VERB+AUX+AUX",
52
- "40": "B-VERB+AUX+NOUN",
53
- "41": "B-VERB+AUX+PART",
54
- "42": "B-VERB+AUX+SCONJ",
55
- "43": "B-VERB+AUX|Polarity=Neg",
56
- "44": "B-X",
57
- "45": "CCONJ",
58
- "46": "DET",
59
- "47": "I-ADJ",
60
- "48": "I-ADJ+ADJ",
61
- "49": "I-ADJ+AUX+AUX",
62
- "50": "I-ADJ+VERB",
63
- "51": "I-ADP",
64
- "52": "I-ADP+NOUN",
65
- "53": "I-ADV",
66
- "54": "I-ADV+ADP",
67
- "55": "I-ADV+ADP+VERB",
68
- "56": "I-AUX",
69
- "57": "I-AUX+AUX",
70
- "58": "I-AUX+AUX+AUX",
71
- "59": "I-AUX+AUX+PART",
72
- "60": "I-AUX+SCONJ",
73
- "61": "I-AUX|Polarity=Neg",
74
- "62": "I-AUX|Polarity=Neg+VERB",
75
- "63": "I-CCONJ",
76
- "64": "I-DET",
77
- "65": "I-INTJ",
78
- "66": "I-NOUN",
79
- "67": "I-NOUN+ADJ",
80
- "68": "I-NOUN+ADP",
81
- "69": "I-NOUN|Polarity=Neg",
82
- "70": "I-NUM",
83
- "71": "I-PART",
84
- "72": "I-PRON",
85
- "73": "I-PROPN",
86
- "74": "I-PUNCT",
87
- "75": "I-SCONJ",
88
- "76": "I-SYM",
89
- "77": "I-VERB",
90
- "78": "I-VERB+AUX",
91
- "79": "I-VERB+AUX+AUX",
92
- "80": "I-VERB+AUX+NOUN",
93
- "81": "I-VERB+AUX+PART",
94
- "82": "I-VERB+AUX+SCONJ",
95
- "83": "I-VERB+AUX|Polarity=Neg",
96
- "84": "I-X",
97
- "85": "NOUN",
98
- "86": "NOUN+ADP",
99
- "87": "NOUN+AUX",
100
- "88": "NUM",
101
- "89": "PART",
102
- "90": "PRON",
103
- "91": "PRON+ADP",
104
- "92": "PROPN",
105
- "93": "PUNCT",
106
- "94": "SCONJ",
107
- "95": "SYM",
108
- "96": "VERB",
109
- "97": "VERB+AUX",
110
- "98": "VERB+AUX+PART",
111
- "99": "VERB+AUX|Polarity=Neg",
112
- "100": "X"
113
  },
114
  "initializer_range": 0.02,
115
  "intermediate_size": 4096,
@@ -119,102 +114,97 @@
119
  "ADP": 2,
120
  "ADV": 3,
121
  "AUX": 4,
122
- "AUX|Polarity=Neg": 5,
123
- "AUX|Polarity=Neg+VERB": 6,
124
- "B-ADJ": 7,
125
- "B-ADJ+ADJ": 8,
126
- "B-ADJ+AUX+AUX": 9,
127
- "B-ADJ+VERB": 10,
128
- "B-ADP": 11,
129
- "B-ADP+NOUN": 12,
130
- "B-ADV": 13,
131
- "B-ADV+ADP": 14,
132
- "B-ADV+ADP+VERB": 15,
133
- "B-AUX": 16,
134
- "B-AUX+AUX": 17,
135
- "B-AUX+AUX+AUX": 18,
136
- "B-AUX+AUX+PART": 19,
137
  "B-AUX+SCONJ": 20,
138
- "B-AUX|Polarity=Neg": 21,
139
- "B-AUX|Polarity=Neg+VERB": 22,
140
- "B-CCONJ": 23,
141
- "B-DET": 24,
142
- "B-INTJ": 25,
143
- "B-NOUN": 26,
144
- "B-NOUN+ADJ": 27,
145
- "B-NOUN+ADP": 28,
146
- "B-NOUN|Polarity=Neg": 29,
147
- "B-NUM": 30,
148
- "B-PART": 31,
149
- "B-PRON": 32,
150
- "B-PROPN": 33,
151
- "B-PUNCT": 34,
152
- "B-SCONJ": 35,
153
- "B-SYM": 36,
154
- "B-VERB": 37,
155
- "B-VERB+AUX": 38,
156
- "B-VERB+AUX+AUX": 39,
157
- "B-VERB+AUX+NOUN": 40,
158
- "B-VERB+AUX+PART": 41,
159
- "B-VERB+AUX+SCONJ": 42,
160
- "B-VERB+AUX|Polarity=Neg": 43,
161
- "B-X": 44,
162
- "CCONJ": 45,
163
- "DET": 46,
164
- "I-ADJ": 47,
165
- "I-ADJ+ADJ": 48,
166
- "I-ADJ+AUX+AUX": 49,
167
- "I-ADJ+VERB": 50,
168
- "I-ADP": 51,
169
- "I-ADP+NOUN": 52,
170
- "I-ADV": 53,
171
- "I-ADV+ADP": 54,
172
- "I-ADV+ADP+VERB": 55,
173
- "I-AUX": 56,
174
- "I-AUX+AUX": 57,
175
- "I-AUX+AUX+AUX": 58,
176
- "I-AUX+AUX+PART": 59,
177
- "I-AUX+SCONJ": 60,
178
- "I-AUX|Polarity=Neg": 61,
179
- "I-AUX|Polarity=Neg+VERB": 62,
180
- "I-CCONJ": 63,
181
- "I-DET": 64,
182
- "I-INTJ": 65,
183
- "I-NOUN": 66,
184
- "I-NOUN+ADJ": 67,
185
- "I-NOUN+ADP": 68,
186
- "I-NOUN|Polarity=Neg": 69,
187
- "I-NUM": 70,
188
- "I-PART": 71,
189
- "I-PRON": 72,
190
- "I-PROPN": 73,
191
- "I-PUNCT": 74,
192
- "I-SCONJ": 75,
193
- "I-SYM": 76,
194
- "I-VERB": 77,
195
- "I-VERB+AUX": 78,
196
- "I-VERB+AUX+AUX": 79,
197
- "I-VERB+AUX+NOUN": 80,
198
- "I-VERB+AUX+PART": 81,
199
- "I-VERB+AUX+SCONJ": 82,
200
- "I-VERB+AUX|Polarity=Neg": 83,
201
- "I-X": 84,
202
- "NOUN": 85,
203
- "NOUN+ADP": 86,
204
- "NOUN+AUX": 87,
205
- "NUM": 88,
206
- "PART": 89,
207
- "PRON": 90,
208
- "PRON+ADP": 91,
209
- "PROPN": 92,
210
- "PUNCT": 93,
211
- "SCONJ": 94,
212
- "SYM": 95,
213
- "VERB": 96,
214
- "VERB+AUX": 97,
215
- "VERB+AUX+PART": 98,
216
- "VERB+AUX|Polarity=Neg": 99,
217
- "X": 100
218
  },
219
  "layer_norm_eps": 1e-07,
220
  "max_position_embeddings": 512,
@@ -226,9 +216,12 @@
226
  "pooler_dropout": 0,
227
  "pooler_hidden_act": "gelu",
228
  "pooler_hidden_size": 1024,
229
- "pos_att_type": null,
230
- "position_biased_input": true,
231
- "relative_attention": false,
 
 
 
232
  "task_specific_params": {
233
  "upos_multiword": {
234
  "ADJ+ADJ": {
@@ -280,6 +273,10 @@
280
  ]
281
  },
282
  "AUX+AUX": {
 
 
 
 
283
  "\u30c1\u30e3\u30c3\u30bf": [
284
  "\u30c1\u30e3\u30c3",
285
  "\u30bf"
@@ -304,6 +301,13 @@
304
  "\u3060\u3051"
305
  ]
306
  },
 
 
 
 
 
 
 
307
  "AUX+SCONJ": {
308
  "\u3060\u3051\u3069": [
309
  "\u3060",
@@ -318,7 +322,7 @@
318
  "\u3051\u3069"
319
  ]
320
  },
321
- "AUX|Polarity=Neg+VERB": {
322
  "\u306a\u304f\u306a\u3063": [
323
  "\u306a\u304f",
324
  "\u306a\u3063"
@@ -393,6 +397,10 @@
393
  "\u304a\u3053\u306a\u308f",
394
  "\u308c"
395
  ],
 
 
 
 
396
  "\u3055\u3089\u308f\u308c": [
397
  "\u3055\u3089\u308f",
398
  "\u308c"
@@ -417,6 +425,10 @@
417
  "\u306a\u3058\u307e",
418
  "\u305b"
419
  ],
 
 
 
 
420
  "\u307f\u306a\u3055\u308c": [
421
  "\u307f\u306a\u3055",
422
  "\u308c"
@@ -469,6 +481,10 @@
469
  "\u548c\u307e",
470
  "\u305b"
471
  ],
 
 
 
 
472
  "\u554f\u308f\u308c": [
473
  "\u554f\u308f",
474
  "\u308c"
@@ -537,6 +553,10 @@
537
  "\u679c\u305f\u3059",
538
  "\u3079\u304f"
539
  ],
 
 
 
 
540
  "\u6b4c\u308f\u308c": [
541
  "\u6b4c\u308f",
542
  "\u308c"
@@ -577,6 +597,10 @@
577
  "\u884c\u3063",
578
  "\u3061\u3083\u3044"
579
  ],
 
 
 
 
580
  "\u884c\u308f\u308c": [
581
  "\u884c\u308f",
582
  "\u308c"
@@ -719,34 +743,12 @@
719
  "\u305f",
720
  "\u305f\u3081\u306b"
721
  ]
722
- },
723
- "VERB+AUX|Polarity=Neg": {
724
- "\u304b\u307e\u308f\u305a": [
725
- "\u304b\u307e\u308f",
726
- "\u305a"
727
- ],
728
- "\u306a\u3089\u305a": [
729
- "\u306a\u3089",
730
- "\u305a"
731
- ],
732
- "\u554f\u308f\u305a": [
733
- "\u554f\u308f",
734
- "\u305a"
735
- ],
736
- "\u69cb\u308f\u305a": [
737
- "\u69cb\u308f",
738
- "\u305a"
739
- ],
740
- "\u884c\u308f\u305a": [
741
- "\u884c\u308f",
742
- "\u305a"
743
- ]
744
  }
745
  }
746
  },
747
  "tokenizer_class": "DebertaV2TokenizerFast",
748
  "torch_dtype": "float32",
749
- "transformers_version": "4.19.4",
750
  "type_vocab_size": 0,
751
  "vocab_size": 32000
752
  }
14
  "2": "ADP",
15
  "3": "ADV",
16
  "4": "AUX",
17
+ "5": "AUX+VERB",
18
+ "6": "B-ADJ",
19
+ "7": "B-ADJ+ADJ",
20
+ "8": "B-ADJ+AUX+AUX",
21
+ "9": "B-ADJ+VERB",
22
+ "10": "B-ADP",
23
+ "11": "B-ADP+NOUN",
24
+ "12": "B-ADV",
25
+ "13": "B-ADV+ADP",
26
+ "14": "B-ADV+ADP+VERB",
27
+ "15": "B-AUX",
28
+ "16": "B-AUX+AUX",
29
+ "17": "B-AUX+AUX+AUX",
30
+ "18": "B-AUX+AUX+PART",
31
+ "19": "B-AUX+AUX+VERB",
32
  "20": "B-AUX+SCONJ",
33
+ "21": "B-AUX+VERB",
34
+ "22": "B-CCONJ",
35
+ "23": "B-DET",
36
+ "24": "B-INTJ",
37
+ "25": "B-NOUN",
38
+ "26": "B-NOUN+ADJ",
39
+ "27": "B-NOUN+ADP",
40
+ "28": "B-NUM",
41
+ "29": "B-PART",
42
+ "30": "B-PRON",
43
+ "31": "B-PROPN",
44
+ "32": "B-PUNCT",
45
+ "33": "B-SCONJ",
46
+ "34": "B-SYM",
47
+ "35": "B-VERB",
48
+ "36": "B-VERB+AUX",
49
+ "37": "B-VERB+AUX+AUX",
50
+ "38": "B-VERB+AUX+NOUN",
51
+ "39": "B-VERB+AUX+PART",
52
+ "40": "B-VERB+AUX+SCONJ",
53
+ "41": "B-X",
54
+ "42": "CCONJ",
55
+ "43": "DET",
56
+ "44": "I-ADJ",
57
+ "45": "I-ADJ+ADJ",
58
+ "46": "I-ADJ+AUX+AUX",
59
+ "47": "I-ADJ+VERB",
60
+ "48": "I-ADP",
61
+ "49": "I-ADP+NOUN",
62
+ "50": "I-ADV",
63
+ "51": "I-ADV+ADP",
64
+ "52": "I-ADV+ADP+VERB",
65
+ "53": "I-AUX",
66
+ "54": "I-AUX+AUX",
67
+ "55": "I-AUX+AUX+AUX",
68
+ "56": "I-AUX+AUX+PART",
69
+ "57": "I-AUX+AUX+VERB",
70
+ "58": "I-AUX+SCONJ",
71
+ "59": "I-AUX+VERB",
72
+ "60": "I-CCONJ",
73
+ "61": "I-DET",
74
+ "62": "I-INTJ",
75
+ "63": "I-NOUN",
76
+ "64": "I-NOUN+ADJ",
77
+ "65": "I-NOUN+ADP",
78
+ "66": "I-NUM",
79
+ "67": "I-PART",
80
+ "68": "I-PRON",
81
+ "69": "I-PROPN",
82
+ "70": "I-PUNCT",
83
+ "71": "I-SCONJ",
84
+ "72": "I-SYM",
85
+ "73": "I-VERB",
86
+ "74": "I-VERB+AUX",
87
+ "75": "I-VERB+AUX+AUX",
88
+ "76": "I-VERB+AUX+NOUN",
89
+ "77": "I-VERB+AUX+PART",
90
+ "78": "I-VERB+AUX+SCONJ",
91
+ "79": "I-X",
92
+ "80": "INTJ",
93
+ "81": "NOUN",
94
+ "82": "NOUN+ADP",
95
+ "83": "NOUN+AUX",
96
+ "84": "NUM",
97
+ "85": "PART",
98
+ "86": "PRON",
99
+ "87": "PRON+ADP",
100
+ "88": "PROPN",
101
+ "89": "PUNCT",
102
+ "90": "SCONJ",
103
+ "91": "SYM",
104
+ "92": "VERB",
105
+ "93": "VERB+AUX",
106
+ "94": "VERB+AUX+PART",
107
+ "95": "X"
 
 
 
 
 
108
  },
109
  "initializer_range": 0.02,
110
  "intermediate_size": 4096,
114
  "ADP": 2,
115
  "ADV": 3,
116
  "AUX": 4,
117
+ "AUX+VERB": 5,
118
+ "B-ADJ": 6,
119
+ "B-ADJ+ADJ": 7,
120
+ "B-ADJ+AUX+AUX": 8,
121
+ "B-ADJ+VERB": 9,
122
+ "B-ADP": 10,
123
+ "B-ADP+NOUN": 11,
124
+ "B-ADV": 12,
125
+ "B-ADV+ADP": 13,
126
+ "B-ADV+ADP+VERB": 14,
127
+ "B-AUX": 15,
128
+ "B-AUX+AUX": 16,
129
+ "B-AUX+AUX+AUX": 17,
130
+ "B-AUX+AUX+PART": 18,
131
+ "B-AUX+AUX+VERB": 19,
132
  "B-AUX+SCONJ": 20,
133
+ "B-AUX+VERB": 21,
134
+ "B-CCONJ": 22,
135
+ "B-DET": 23,
136
+ "B-INTJ": 24,
137
+ "B-NOUN": 25,
138
+ "B-NOUN+ADJ": 26,
139
+ "B-NOUN+ADP": 27,
140
+ "B-NUM": 28,
141
+ "B-PART": 29,
142
+ "B-PRON": 30,
143
+ "B-PROPN": 31,
144
+ "B-PUNCT": 32,
145
+ "B-SCONJ": 33,
146
+ "B-SYM": 34,
147
+ "B-VERB": 35,
148
+ "B-VERB+AUX": 36,
149
+ "B-VERB+AUX+AUX": 37,
150
+ "B-VERB+AUX+NOUN": 38,
151
+ "B-VERB+AUX+PART": 39,
152
+ "B-VERB+AUX+SCONJ": 40,
153
+ "B-X": 41,
154
+ "CCONJ": 42,
155
+ "DET": 43,
156
+ "I-ADJ": 44,
157
+ "I-ADJ+ADJ": 45,
158
+ "I-ADJ+AUX+AUX": 46,
159
+ "I-ADJ+VERB": 47,
160
+ "I-ADP": 48,
161
+ "I-ADP+NOUN": 49,
162
+ "I-ADV": 50,
163
+ "I-ADV+ADP": 51,
164
+ "I-ADV+ADP+VERB": 52,
165
+ "I-AUX": 53,
166
+ "I-AUX+AUX": 54,
167
+ "I-AUX+AUX+AUX": 55,
168
+ "I-AUX+AUX+PART": 56,
169
+ "I-AUX+AUX+VERB": 57,
170
+ "I-AUX+SCONJ": 58,
171
+ "I-AUX+VERB": 59,
172
+ "I-CCONJ": 60,
173
+ "I-DET": 61,
174
+ "I-INTJ": 62,
175
+ "I-NOUN": 63,
176
+ "I-NOUN+ADJ": 64,
177
+ "I-NOUN+ADP": 65,
178
+ "I-NUM": 66,
179
+ "I-PART": 67,
180
+ "I-PRON": 68,
181
+ "I-PROPN": 69,
182
+ "I-PUNCT": 70,
183
+ "I-SCONJ": 71,
184
+ "I-SYM": 72,
185
+ "I-VERB": 73,
186
+ "I-VERB+AUX": 74,
187
+ "I-VERB+AUX+AUX": 75,
188
+ "I-VERB+AUX+NOUN": 76,
189
+ "I-VERB+AUX+PART": 77,
190
+ "I-VERB+AUX+SCONJ": 78,
191
+ "I-X": 79,
192
+ "INTJ": 80,
193
+ "NOUN": 81,
194
+ "NOUN+ADP": 82,
195
+ "NOUN+AUX": 83,
196
+ "NUM": 84,
197
+ "PART": 85,
198
+ "PRON": 86,
199
+ "PRON+ADP": 87,
200
+ "PROPN": 88,
201
+ "PUNCT": 89,
202
+ "SCONJ": 90,
203
+ "SYM": 91,
204
+ "VERB": 92,
205
+ "VERB+AUX": 93,
206
+ "VERB+AUX+PART": 94,
207
+ "X": 95
 
 
 
 
 
208
  },
209
  "layer_norm_eps": 1e-07,
210
  "max_position_embeddings": 512,
216
  "pooler_dropout": 0,
217
  "pooler_hidden_act": "gelu",
218
  "pooler_hidden_size": 1024,
219
+ "pos_att_type": [
220
+ "p2c",
221
+ "c2p"
222
+ ],
223
+ "position_biased_input": false,
224
+ "relative_attention": true,
225
  "task_specific_params": {
226
  "upos_multiword": {
227
  "ADJ+ADJ": {
273
  ]
274
  },
275
  "AUX+AUX": {
276
+ "\u3066\u3057\u307e\u3044\u307e\u3057": [
277
+ "\u3066\u3057\u307e\u3044",
278
+ "\u307e\u3057"
279
+ ],
280
  "\u30c1\u30e3\u30c3\u30bf": [
281
  "\u30c1\u30e3\u30c3",
282
  "\u30bf"
301
  "\u3060\u3051"
302
  ]
303
  },
304
+ "AUX+AUX+VERB": {
305
+ "\u3084\u3063\u305f\u3089\u304b\u304b\u3063": [
306
+ "\u3084\u3063",
307
+ "\u305f\u3089",
308
+ "\u304b\u304b\u3063"
309
+ ]
310
+ },
311
  "AUX+SCONJ": {
312
  "\u3060\u3051\u3069": [
313
  "\u3060",
322
  "\u3051\u3069"
323
  ]
324
  },
325
+ "AUX+VERB": {
326
  "\u306a\u304f\u306a\u3063": [
327
  "\u306a\u304f",
328
  "\u306a\u3063"
397
  "\u304a\u3053\u306a\u308f",
398
  "\u308c"
399
  ],
400
+ "\u304b\u307e\u308f\u305a": [
401
+ "\u304b\u307e\u308f",
402
+ "\u305a"
403
+ ],
404
  "\u3055\u3089\u308f\u308c": [
405
  "\u3055\u3089\u308f",
406
  "\u308c"
425
  "\u306a\u3058\u307e",
426
  "\u305b"
427
  ],
428
+ "\u306a\u3089\u305a": [
429
+ "\u306a\u3089",
430
+ "\u305a"
431
+ ],
432
  "\u307f\u306a\u3055\u308c": [
433
  "\u307f\u306a\u3055",
434
  "\u308c"
481
  "\u548c\u307e",
482
  "\u305b"
483
  ],
484
+ "\u554f\u308f\u305a": [
485
+ "\u554f\u308f",
486
+ "\u305a"
487
+ ],
488
  "\u554f\u308f\u308c": [
489
  "\u554f\u308f",
490
  "\u308c"
553
  "\u679c\u305f\u3059",
554
  "\u3079\u304f"
555
  ],
556
+ "\u69cb\u308f\u305a": [
557
+ "\u69cb\u308f",
558
+ "\u305a"
559
+ ],
560
  "\u6b4c\u308f\u308c": [
561
  "\u6b4c\u308f",
562
  "\u308c"
597
  "\u884c\u3063",
598
  "\u3061\u3083\u3044"
599
  ],
600
+ "\u884c\u308f\u305a": [
601
+ "\u884c\u308f",
602
+ "\u305a"
603
+ ],
604
  "\u884c\u308f\u308c": [
605
  "\u884c\u308f",
606
  "\u308c"
743
  "\u305f",
744
  "\u305f\u3081\u306b"
745
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
746
  }
747
  }
748
  },
749
  "tokenizer_class": "DebertaV2TokenizerFast",
750
  "torch_dtype": "float32",
751
+ "transformers_version": "4.22.1",
752
  "type_vocab_size": 0,
753
  "vocab_size": 32000
754
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:141c5df5ee7bd2676fea778d6ac7a97bfbdde0c5920254ba4afd91ad1ad65276
3
- size 1342965811
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf0da4c537c7bce06e4170930dc3c9b35b5bc275dd0e6d62192f5a1102c71190
3
+ size 1546599283
special_tokens_map.json CHANGED
@@ -1 +1,9 @@
1
- {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": "[UNK]"
9
+ }
supar.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea810c64722637e4da616ecda3a31fe87001a296f7153b3dd546b82ca3990584
3
- size 1391428779
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5248b013cc3e84977dab33504b77ee262458ce0a7b7961ceed4fd59dc74676e
3
+ size 1595110891
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
tokenizer_config.json CHANGED
@@ -1 +1,14 @@
1
- {"do_lower_case": false, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "split_by_punct": true, "keep_accents": true, "model_max_length": 512, "tokenizer_class": "DebertaV2TokenizerFast"}
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": false,
5
+ "eos_token": "[SEP]",
6
+ "keep_accents": true,
7
+ "mask_token": "[MASK]",
8
+ "model_max_length": 512,
9
+ "pad_token": "[PAD]",
10
+ "sep_token": "[SEP]",
11
+ "split_by_punct": true,
12
+ "tokenizer_class": "DebertaV2TokenizerFast",
13
+ "unk_token": "[UNK]"
14
+ }