KoichiYasuoka committed on
Commit
32b1dca
1 Parent(s): 7cbf54c

model improved

Browse files
config.json CHANGED
@@ -14,102 +14,96 @@
14
  "2": "ADP",
15
  "3": "ADV",
16
  "4": "AUX",
17
- "5": "AUX|Polarity=Neg",
18
- "6": "AUX|Polarity=Neg+VERB",
19
- "7": "B-ADJ",
20
- "8": "B-ADJ+ADJ",
21
- "9": "B-ADJ+AUX+AUX",
22
- "10": "B-ADJ+VERB",
23
- "11": "B-ADP",
24
- "12": "B-ADP+NOUN",
25
- "13": "B-ADV",
26
- "14": "B-ADV+ADP",
27
- "15": "B-ADV+ADP+VERB",
28
- "16": "B-AUX",
29
- "17": "B-AUX+AUX",
30
- "18": "B-AUX+AUX+AUX",
31
- "19": "B-AUX+AUX+PART",
32
- "20": "B-AUX+SCONJ",
33
- "21": "B-AUX|Polarity=Neg",
34
- "22": "B-AUX|Polarity=Neg+VERB",
35
- "23": "B-CCONJ",
36
- "24": "B-DET",
37
- "25": "B-INTJ",
38
- "26": "B-NOUN",
39
- "27": "B-NOUN+ADJ",
40
- "28": "B-NOUN+ADP",
41
- "29": "B-NOUN|Polarity=Neg",
42
- "30": "B-NUM",
43
- "31": "B-PART",
44
- "32": "B-PRON",
45
- "33": "B-PROPN",
46
- "34": "B-PUNCT",
47
- "35": "B-SCONJ",
48
- "36": "B-SYM",
49
- "37": "B-VERB",
50
- "38": "B-VERB+AUX",
51
- "39": "B-VERB+AUX+AUX",
52
- "40": "B-VERB+AUX+NOUN",
53
- "41": "B-VERB+AUX+PART",
54
- "42": "B-VERB+AUX+SCONJ",
55
- "43": "B-VERB+AUX|Polarity=Neg",
56
- "44": "B-X",
57
- "45": "CCONJ",
58
- "46": "DET",
59
- "47": "I-ADJ",
60
- "48": "I-ADJ+ADJ",
61
- "49": "I-ADJ+AUX+AUX",
62
- "50": "I-ADJ+VERB",
63
- "51": "I-ADP",
64
- "52": "I-ADP+NOUN",
65
- "53": "I-ADV",
66
- "54": "I-ADV+ADP",
67
- "55": "I-ADV+ADP+VERB",
68
- "56": "I-AUX",
69
- "57": "I-AUX+AUX",
70
- "58": "I-AUX+AUX+AUX",
71
- "59": "I-AUX+AUX+PART",
72
- "60": "I-AUX+SCONJ",
73
- "61": "I-AUX|Polarity=Neg",
74
- "62": "I-AUX|Polarity=Neg+VERB",
75
- "63": "I-CCONJ",
76
- "64": "I-DET",
77
- "65": "I-INTJ",
78
- "66": "I-NOUN",
79
- "67": "I-NOUN+ADJ",
80
- "68": "I-NOUN+ADP",
81
- "69": "I-NOUN|Polarity=Neg",
82
- "70": "I-NUM",
83
- "71": "I-PART",
84
- "72": "I-PRON",
85
- "73": "I-PROPN",
86
- "74": "I-PUNCT",
87
- "75": "I-SCONJ",
88
- "76": "I-SYM",
89
- "77": "I-VERB",
90
- "78": "I-VERB+AUX",
91
- "79": "I-VERB+AUX+AUX",
92
- "80": "I-VERB+AUX+NOUN",
93
- "81": "I-VERB+AUX+PART",
94
- "82": "I-VERB+AUX+SCONJ",
95
- "83": "I-VERB+AUX|Polarity=Neg",
96
- "84": "I-X",
97
- "85": "NOUN",
98
- "86": "NOUN+ADP",
99
- "87": "NOUN+AUX",
100
- "88": "NUM",
101
- "89": "PART",
102
- "90": "PRON",
103
- "91": "PRON+ADP",
104
- "92": "PROPN",
105
- "93": "PUNCT",
106
- "94": "SCONJ",
107
- "95": "SYM",
108
- "96": "VERB",
109
- "97": "VERB+AUX",
110
- "98": "VERB+AUX+PART",
111
- "99": "VERB+AUX|Polarity=Neg",
112
- "100": "X"
113
  },
114
  "initializer_range": 0.02,
115
  "intermediate_size": 3072,
@@ -119,102 +113,96 @@
119
  "ADP": 2,
120
  "ADV": 3,
121
  "AUX": 4,
122
- "AUX|Polarity=Neg": 5,
123
- "AUX|Polarity=Neg+VERB": 6,
124
- "B-ADJ": 7,
125
- "B-ADJ+ADJ": 8,
126
- "B-ADJ+AUX+AUX": 9,
127
- "B-ADJ+VERB": 10,
128
- "B-ADP": 11,
129
- "B-ADP+NOUN": 12,
130
- "B-ADV": 13,
131
- "B-ADV+ADP": 14,
132
- "B-ADV+ADP+VERB": 15,
133
- "B-AUX": 16,
134
- "B-AUX+AUX": 17,
135
- "B-AUX+AUX+AUX": 18,
136
- "B-AUX+AUX+PART": 19,
137
- "B-AUX+SCONJ": 20,
138
- "B-AUX|Polarity=Neg": 21,
139
- "B-AUX|Polarity=Neg+VERB": 22,
140
- "B-CCONJ": 23,
141
- "B-DET": 24,
142
- "B-INTJ": 25,
143
- "B-NOUN": 26,
144
- "B-NOUN+ADJ": 27,
145
- "B-NOUN+ADP": 28,
146
- "B-NOUN|Polarity=Neg": 29,
147
- "B-NUM": 30,
148
- "B-PART": 31,
149
- "B-PRON": 32,
150
- "B-PROPN": 33,
151
- "B-PUNCT": 34,
152
- "B-SCONJ": 35,
153
- "B-SYM": 36,
154
- "B-VERB": 37,
155
- "B-VERB+AUX": 38,
156
- "B-VERB+AUX+AUX": 39,
157
- "B-VERB+AUX+NOUN": 40,
158
- "B-VERB+AUX+PART": 41,
159
- "B-VERB+AUX+SCONJ": 42,
160
- "B-VERB+AUX|Polarity=Neg": 43,
161
- "B-X": 44,
162
- "CCONJ": 45,
163
- "DET": 46,
164
- "I-ADJ": 47,
165
- "I-ADJ+ADJ": 48,
166
- "I-ADJ+AUX+AUX": 49,
167
- "I-ADJ+VERB": 50,
168
- "I-ADP": 51,
169
- "I-ADP+NOUN": 52,
170
- "I-ADV": 53,
171
- "I-ADV+ADP": 54,
172
- "I-ADV+ADP+VERB": 55,
173
- "I-AUX": 56,
174
- "I-AUX+AUX": 57,
175
- "I-AUX+AUX+AUX": 58,
176
- "I-AUX+AUX+PART": 59,
177
- "I-AUX+SCONJ": 60,
178
- "I-AUX|Polarity=Neg": 61,
179
- "I-AUX|Polarity=Neg+VERB": 62,
180
- "I-CCONJ": 63,
181
- "I-DET": 64,
182
- "I-INTJ": 65,
183
- "I-NOUN": 66,
184
- "I-NOUN+ADJ": 67,
185
- "I-NOUN+ADP": 68,
186
- "I-NOUN|Polarity=Neg": 69,
187
- "I-NUM": 70,
188
- "I-PART": 71,
189
- "I-PRON": 72,
190
- "I-PROPN": 73,
191
- "I-PUNCT": 74,
192
- "I-SCONJ": 75,
193
- "I-SYM": 76,
194
- "I-VERB": 77,
195
- "I-VERB+AUX": 78,
196
- "I-VERB+AUX+AUX": 79,
197
- "I-VERB+AUX+NOUN": 80,
198
- "I-VERB+AUX+PART": 81,
199
- "I-VERB+AUX+SCONJ": 82,
200
- "I-VERB+AUX|Polarity=Neg": 83,
201
- "I-X": 84,
202
- "NOUN": 85,
203
- "NOUN+ADP": 86,
204
- "NOUN+AUX": 87,
205
- "NUM": 88,
206
- "PART": 89,
207
- "PRON": 90,
208
- "PRON+ADP": 91,
209
- "PROPN": 92,
210
- "PUNCT": 93,
211
- "SCONJ": 94,
212
- "SYM": 95,
213
- "VERB": 96,
214
- "VERB+AUX": 97,
215
- "VERB+AUX+PART": 98,
216
- "VERB+AUX|Polarity=Neg": 99,
217
- "X": 100
218
  },
219
  "layer_norm_eps": 1e-07,
220
  "max_position_embeddings": 512,
@@ -226,9 +214,12 @@
226
  "pooler_dropout": 0,
227
  "pooler_hidden_act": "gelu",
228
  "pooler_hidden_size": 768,
229
- "pos_att_type": null,
230
- "position_biased_input": true,
231
- "relative_attention": false,
 
 
 
232
  "task_specific_params": {
233
  "upos_multiword": {
234
  "ADJ+ADJ": {
@@ -318,7 +309,7 @@
318
  "\u3051\u3069"
319
  ]
320
  },
321
- "AUX|Polarity=Neg+VERB": {
322
  "\u306a\u304f\u306a\u3063": [
323
  "\u306a\u304f",
324
  "\u306a\u3063"
@@ -380,6 +371,18 @@
380
  "\u304b"
381
  ]
382
  },
 
 
 
 
 
 
 
 
 
 
 
 
383
  "VERB+AUX": {
384
  "\u3044\u308f\u308c": [
385
  "\u3044\u308f",
@@ -393,6 +396,10 @@
393
  "\u304a\u3053\u306a\u308f",
394
  "\u308c"
395
  ],
 
 
 
 
396
  "\u3055\u3089\u308f\u308c": [
397
  "\u3055\u3089\u308f",
398
  "\u308c"
@@ -417,6 +424,10 @@
417
  "\u306a\u3058\u307e",
418
  "\u305b"
419
  ],
 
 
 
 
420
  "\u307f\u306a\u3055\u308c": [
421
  "\u307f\u306a\u3055",
422
  "\u308c"
@@ -469,6 +480,10 @@
469
  "\u548c\u307e",
470
  "\u305b"
471
  ],
 
 
 
 
472
  "\u554f\u308f\u308c": [
473
  "\u554f\u308f",
474
  "\u308c"
@@ -537,6 +552,10 @@
537
  "\u679c\u305f\u3059",
538
  "\u3079\u304f"
539
  ],
 
 
 
 
540
  "\u6b4c\u308f\u308c": [
541
  "\u6b4c\u308f",
542
  "\u308c"
@@ -577,6 +596,10 @@
577
  "\u884c\u3063",
578
  "\u3061\u3083\u3044"
579
  ],
 
 
 
 
580
  "\u884c\u308f\u308c": [
581
  "\u884c\u308f",
582
  "\u308c"
@@ -719,34 +742,12 @@
719
  "\u305f",
720
  "\u305f\u3081\u306b"
721
  ]
722
- },
723
- "VERB+AUX|Polarity=Neg": {
724
- "\u304b\u307e\u308f\u305a": [
725
- "\u304b\u307e\u308f",
726
- "\u305a"
727
- ],
728
- "\u306a\u3089\u305a": [
729
- "\u306a\u3089",
730
- "\u305a"
731
- ],
732
- "\u554f\u308f\u305a": [
733
- "\u554f\u308f",
734
- "\u305a"
735
- ],
736
- "\u69cb\u308f\u305a": [
737
- "\u69cb\u308f",
738
- "\u305a"
739
- ],
740
- "\u884c\u308f\u305a": [
741
- "\u884c\u308f",
742
- "\u305a"
743
- ]
744
  }
745
  }
746
  },
747
  "tokenizer_class": "DebertaV2TokenizerFast",
748
  "torch_dtype": "float32",
749
- "transformers_version": "4.19.4",
750
  "type_vocab_size": 0,
751
  "vocab_size": 32000
752
  }
14
  "2": "ADP",
15
  "3": "ADV",
16
  "4": "AUX",
17
+ "5": "AUX+VERB",
18
+ "6": "B-ADJ",
19
+ "7": "B-ADJ+ADJ",
20
+ "8": "B-ADJ+AUX+AUX",
21
+ "9": "B-ADJ+VERB",
22
+ "10": "B-ADP",
23
+ "11": "B-ADP+NOUN",
24
+ "12": "B-ADV",
25
+ "13": "B-ADV+ADP",
26
+ "14": "B-ADV+ADP+VERB",
27
+ "15": "B-AUX",
28
+ "16": "B-AUX+AUX",
29
+ "17": "B-AUX+AUX+AUX",
30
+ "18": "B-AUX+AUX+PART",
31
+ "19": "B-AUX+SCONJ",
32
+ "20": "B-AUX+VERB",
33
+ "21": "B-CCONJ",
34
+ "22": "B-DET",
35
+ "23": "B-INTJ",
36
+ "24": "B-NOUN",
37
+ "25": "B-NOUN+ADJ",
38
+ "26": "B-NOUN+ADP",
39
+ "27": "B-NUM",
40
+ "28": "B-PART",
41
+ "29": "B-PRON",
42
+ "30": "B-PROPN",
43
+ "31": "B-PUNCT+NOUN",
44
+ "32": "B-SCONJ",
45
+ "33": "B-SYM",
46
+ "34": "B-VERB",
47
+ "35": "B-VERB+AUX",
48
+ "36": "B-VERB+AUX+AUX",
49
+ "37": "B-VERB+AUX+NOUN",
50
+ "38": "B-VERB+AUX+PART",
51
+ "39": "B-VERB+AUX+SCONJ",
52
+ "40": "B-X",
53
+ "41": "CCONJ",
54
+ "42": "DET",
55
+ "43": "I-ADJ",
56
+ "44": "I-ADJ+ADJ",
57
+ "45": "I-ADJ+AUX+AUX",
58
+ "46": "I-ADJ+VERB",
59
+ "47": "I-ADP",
60
+ "48": "I-ADP+NOUN",
61
+ "49": "I-ADV",
62
+ "50": "I-ADV+ADP",
63
+ "51": "I-ADV+ADP+VERB",
64
+ "52": "I-AUX",
65
+ "53": "I-AUX+AUX",
66
+ "54": "I-AUX+AUX+AUX",
67
+ "55": "I-AUX+AUX+PART",
68
+ "56": "I-AUX+SCONJ",
69
+ "57": "I-AUX+VERB",
70
+ "58": "I-CCONJ",
71
+ "59": "I-DET",
72
+ "60": "I-INTJ",
73
+ "61": "I-NOUN",
74
+ "62": "I-NOUN+ADJ",
75
+ "63": "I-NOUN+ADP",
76
+ "64": "I-NUM",
77
+ "65": "I-PART",
78
+ "66": "I-PRON",
79
+ "67": "I-PROPN",
80
+ "68": "I-PUNCT+NOUN",
81
+ "69": "I-SCONJ",
82
+ "70": "I-SYM",
83
+ "71": "I-VERB",
84
+ "72": "I-VERB+AUX",
85
+ "73": "I-VERB+AUX+AUX",
86
+ "74": "I-VERB+AUX+NOUN",
87
+ "75": "I-VERB+AUX+PART",
88
+ "76": "I-VERB+AUX+SCONJ",
89
+ "77": "I-X",
90
+ "78": "NOUN",
91
+ "79": "NOUN+ADP",
92
+ "80": "NOUN+AUX",
93
+ "81": "NUM",
94
+ "82": "PART",
95
+ "83": "PRON",
96
+ "84": "PRON+ADP",
97
+ "85": "PROPN",
98
+ "86": "PUNCT",
99
+ "87": "PUNCT+PUNCT",
100
+ "88": "PUNCT+PUNCT+PUNCT",
101
+ "89": "SCONJ",
102
+ "90": "SYM",
103
+ "91": "VERB",
104
+ "92": "VERB+AUX",
105
+ "93": "VERB+AUX+PART",
106
+ "94": "X"
 
 
 
 
 
 
107
  },
108
  "initializer_range": 0.02,
109
  "intermediate_size": 3072,
113
  "ADP": 2,
114
  "ADV": 3,
115
  "AUX": 4,
116
+ "AUX+VERB": 5,
117
+ "B-ADJ": 6,
118
+ "B-ADJ+ADJ": 7,
119
+ "B-ADJ+AUX+AUX": 8,
120
+ "B-ADJ+VERB": 9,
121
+ "B-ADP": 10,
122
+ "B-ADP+NOUN": 11,
123
+ "B-ADV": 12,
124
+ "B-ADV+ADP": 13,
125
+ "B-ADV+ADP+VERB": 14,
126
+ "B-AUX": 15,
127
+ "B-AUX+AUX": 16,
128
+ "B-AUX+AUX+AUX": 17,
129
+ "B-AUX+AUX+PART": 18,
130
+ "B-AUX+SCONJ": 19,
131
+ "B-AUX+VERB": 20,
132
+ "B-CCONJ": 21,
133
+ "B-DET": 22,
134
+ "B-INTJ": 23,
135
+ "B-NOUN": 24,
136
+ "B-NOUN+ADJ": 25,
137
+ "B-NOUN+ADP": 26,
138
+ "B-NUM": 27,
139
+ "B-PART": 28,
140
+ "B-PRON": 29,
141
+ "B-PROPN": 30,
142
+ "B-PUNCT+NOUN": 31,
143
+ "B-SCONJ": 32,
144
+ "B-SYM": 33,
145
+ "B-VERB": 34,
146
+ "B-VERB+AUX": 35,
147
+ "B-VERB+AUX+AUX": 36,
148
+ "B-VERB+AUX+NOUN": 37,
149
+ "B-VERB+AUX+PART": 38,
150
+ "B-VERB+AUX+SCONJ": 39,
151
+ "B-X": 40,
152
+ "CCONJ": 41,
153
+ "DET": 42,
154
+ "I-ADJ": 43,
155
+ "I-ADJ+ADJ": 44,
156
+ "I-ADJ+AUX+AUX": 45,
157
+ "I-ADJ+VERB": 46,
158
+ "I-ADP": 47,
159
+ "I-ADP+NOUN": 48,
160
+ "I-ADV": 49,
161
+ "I-ADV+ADP": 50,
162
+ "I-ADV+ADP+VERB": 51,
163
+ "I-AUX": 52,
164
+ "I-AUX+AUX": 53,
165
+ "I-AUX+AUX+AUX": 54,
166
+ "I-AUX+AUX+PART": 55,
167
+ "I-AUX+SCONJ": 56,
168
+ "I-AUX+VERB": 57,
169
+ "I-CCONJ": 58,
170
+ "I-DET": 59,
171
+ "I-INTJ": 60,
172
+ "I-NOUN": 61,
173
+ "I-NOUN+ADJ": 62,
174
+ "I-NOUN+ADP": 63,
175
+ "I-NUM": 64,
176
+ "I-PART": 65,
177
+ "I-PRON": 66,
178
+ "I-PROPN": 67,
179
+ "I-PUNCT+NOUN": 68,
180
+ "I-SCONJ": 69,
181
+ "I-SYM": 70,
182
+ "I-VERB": 71,
183
+ "I-VERB+AUX": 72,
184
+ "I-VERB+AUX+AUX": 73,
185
+ "I-VERB+AUX+NOUN": 74,
186
+ "I-VERB+AUX+PART": 75,
187
+ "I-VERB+AUX+SCONJ": 76,
188
+ "I-X": 77,
189
+ "NOUN": 78,
190
+ "NOUN+ADP": 79,
191
+ "NOUN+AUX": 80,
192
+ "NUM": 81,
193
+ "PART": 82,
194
+ "PRON": 83,
195
+ "PRON+ADP": 84,
196
+ "PROPN": 85,
197
+ "PUNCT": 86,
198
+ "PUNCT+PUNCT": 87,
199
+ "PUNCT+PUNCT+PUNCT": 88,
200
+ "SCONJ": 89,
201
+ "SYM": 90,
202
+ "VERB": 91,
203
+ "VERB+AUX": 92,
204
+ "VERB+AUX+PART": 93,
205
+ "X": 94
 
 
 
 
 
 
206
  },
207
  "layer_norm_eps": 1e-07,
208
  "max_position_embeddings": 512,
214
  "pooler_dropout": 0,
215
  "pooler_hidden_act": "gelu",
216
  "pooler_hidden_size": 768,
217
+ "pos_att_type": [
218
+ "p2c",
219
+ "c2p"
220
+ ],
221
+ "position_biased_input": false,
222
+ "relative_attention": true,
223
  "task_specific_params": {
224
  "upos_multiword": {
225
  "ADJ+ADJ": {
309
  "\u3051\u3069"
310
  ]
311
  },
312
+ "AUX+VERB": {
313
  "\u306a\u304f\u306a\u3063": [
314
  "\u306a\u304f",
315
  "\u306a\u3063"
371
  "\u304b"
372
  ]
373
  },
374
+ "PUNCT+NOUN": {
375
+ ",\u201c\u62c9\u81f4\u76e3\u7981\u201d\u554f\u984c": [
376
+ ",",
377
+ "\u201c\u62c9\u81f4\u76e3\u7981\u201d\u554f\u984c"
378
+ ]
379
+ },
380
+ "PUNCT+PUNCT": {
381
+ ",\u201c": [
382
+ ",",
383
+ "\u201c"
384
+ ]
385
+ },
386
  "VERB+AUX": {
387
  "\u3044\u308f\u308c": [
388
  "\u3044\u308f",
396
  "\u304a\u3053\u306a\u308f",
397
  "\u308c"
398
  ],
399
+ "\u304b\u307e\u308f\u305a": [
400
+ "\u304b\u307e\u308f",
401
+ "\u305a"
402
+ ],
403
  "\u3055\u3089\u308f\u308c": [
404
  "\u3055\u3089\u308f",
405
  "\u308c"
424
  "\u306a\u3058\u307e",
425
  "\u305b"
426
  ],
427
+ "\u306a\u3089\u305a": [
428
+ "\u306a\u3089",
429
+ "\u305a"
430
+ ],
431
  "\u307f\u306a\u3055\u308c": [
432
  "\u307f\u306a\u3055",
433
  "\u308c"
480
  "\u548c\u307e",
481
  "\u305b"
482
  ],
483
+ "\u554f\u308f\u305a": [
484
+ "\u554f\u308f",
485
+ "\u305a"
486
+ ],
487
  "\u554f\u308f\u308c": [
488
  "\u554f\u308f",
489
  "\u308c"
552
  "\u679c\u305f\u3059",
553
  "\u3079\u304f"
554
  ],
555
+ "\u69cb\u308f\u305a": [
556
+ "\u69cb\u308f",
557
+ "\u305a"
558
+ ],
559
  "\u6b4c\u308f\u308c": [
560
  "\u6b4c\u308f",
561
  "\u308c"
596
  "\u884c\u3063",
597
  "\u3061\u3083\u3044"
598
  ],
599
+ "\u884c\u308f\u305a": [
600
+ "\u884c\u308f",
601
+ "\u305a"
602
+ ],
603
  "\u884c\u308f\u308c": [
604
  "\u884c\u308f",
605
  "\u308c"
742
  "\u305f",
743
  "\u305f\u3081\u306b"
744
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
745
  }
746
  }
747
  },
748
  "tokenizer_class": "DebertaV2TokenizerFast",
749
  "torch_dtype": "float32",
750
+ "transformers_version": "4.22.1",
751
  "type_vocab_size": 0,
752
  "vocab_size": 32000
753
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37128693dcce708756bf50fbee84d5d9d61bf02b3c20aa56044b88b1e512d862
3
- size 440482611
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:449963d8f2f70cb7606c6f7a8ec258c9f2d0ace75eacf31d48e356136ceb9cee
3
+ size 498750547
special_tokens_map.json CHANGED
@@ -1 +1,9 @@
1
- {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": "[UNK]"
9
+ }
supar.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddd1931e9712901e6b03586f19cb7ba4ab7bb3da1f40af69b99d77cdc9d5da48
3
- size 488947819
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf053426925c490ebf2a2a0bc6465db9726f7359f3425833e6a5691979032caf
3
+ size 547274827
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
tokenizer_config.json CHANGED
@@ -1 +1,14 @@
1
- {"do_lower_case": false, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "split_by_punct": true, "keep_accents": true, "model_max_length": 512, "tokenizer_class": "DebertaV2TokenizerFast"}
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": false,
5
+ "eos_token": "[SEP]",
6
+ "keep_accents": true,
7
+ "mask_token": "[MASK]",
8
+ "model_max_length": 512,
9
+ "pad_token": "[PAD]",
10
+ "sep_token": "[SEP]",
11
+ "split_by_punct": true,
12
+ "tokenizer_class": "DebertaV2TokenizerFast",
13
+ "unk_token": "[UNK]"
14
+ }