Upload 8 files
Browse files- added_tokens.json +360 -0
- config.json +33 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +107 -0
- spiece.model +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +113 -0
- training_args.bin +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,360 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bai": 32128,
|
3 |
+
"bang": 32129,
|
4 |
+
"bao": 32130,
|
5 |
+
"bei": 32131,
|
6 |
+
"ben": 32132,
|
7 |
+
"beng": 32133,
|
8 |
+
"bian": 32134,
|
9 |
+
"biang": 32135,
|
10 |
+
"biao": 32136,
|
11 |
+
"bie": 32137,
|
12 |
+
"bin": 32138,
|
13 |
+
"bing": 32139,
|
14 |
+
"bu": 32140,
|
15 |
+
"cai": 32141,
|
16 |
+
"can": 32142,
|
17 |
+
"cang": 32143,
|
18 |
+
"cao": 32144,
|
19 |
+
"cei": 32145,
|
20 |
+
"cen": 32146,
|
21 |
+
"ceng": 32147,
|
22 |
+
"cha": 32148,
|
23 |
+
"chai": 32149,
|
24 |
+
"chan": 32150,
|
25 |
+
"chang": 32151,
|
26 |
+
"chao": 32152,
|
27 |
+
"chen": 32153,
|
28 |
+
"cheng": 32154,
|
29 |
+
"chi": 32155,
|
30 |
+
"chong": 32156,
|
31 |
+
"chou": 32157,
|
32 |
+
"chu": 32158,
|
33 |
+
"chua": 32159,
|
34 |
+
"chuai": 32160,
|
35 |
+
"chuan": 32161,
|
36 |
+
"chuang": 32162,
|
37 |
+
"chui": 32163,
|
38 |
+
"chun": 32164,
|
39 |
+
"chuo": 32165,
|
40 |
+
"cong": 32166,
|
41 |
+
"cou": 32167,
|
42 |
+
"cu": 32168,
|
43 |
+
"cuan": 32169,
|
44 |
+
"cui": 32170,
|
45 |
+
"cun": 32171,
|
46 |
+
"cuo": 32172,
|
47 |
+
"dai": 32173,
|
48 |
+
"dan": 32174,
|
49 |
+
"dang": 32175,
|
50 |
+
"dao": 32176,
|
51 |
+
"dei": 32177,
|
52 |
+
"den": 32178,
|
53 |
+
"deng": 32179,
|
54 |
+
"dia": 32180,
|
55 |
+
"dian": 32181,
|
56 |
+
"diao": 32182,
|
57 |
+
"die": 32183,
|
58 |
+
"din": 32184,
|
59 |
+
"ding": 32185,
|
60 |
+
"diu": 32186,
|
61 |
+
"dong": 32187,
|
62 |
+
"dou": 32188,
|
63 |
+
"du": 32189,
|
64 |
+
"duan": 32190,
|
65 |
+
"dui": 32191,
|
66 |
+
"dun": 32192,
|
67 |
+
"duo": 32193,
|
68 |
+
"ei": 32194,
|
69 |
+
"eng": 32195,
|
70 |
+
"fan": 32196,
|
71 |
+
"fang": 32197,
|
72 |
+
"fei": 32198,
|
73 |
+
"fen": 32199,
|
74 |
+
"feng": 32200,
|
75 |
+
"fiao": 32201,
|
76 |
+
"fou": 32202,
|
77 |
+
"fu": 32203,
|
78 |
+
"gai": 32204,
|
79 |
+
"gan": 32205,
|
80 |
+
"gang": 32206,
|
81 |
+
"gao": 32207,
|
82 |
+
"gei": 32208,
|
83 |
+
"gen": 32209,
|
84 |
+
"geng": 32210,
|
85 |
+
"gong": 32211,
|
86 |
+
"gou": 32212,
|
87 |
+
"gu": 32213,
|
88 |
+
"gua": 32214,
|
89 |
+
"guai": 32215,
|
90 |
+
"guan": 32216,
|
91 |
+
"guang": 32217,
|
92 |
+
"gui": 32218,
|
93 |
+
"gun": 32219,
|
94 |
+
"guo": 32220,
|
95 |
+
"hai": 32221,
|
96 |
+
"hang": 32222,
|
97 |
+
"hao": 32223,
|
98 |
+
"hei": 32224,
|
99 |
+
"hen": 32225,
|
100 |
+
"heng": 32226,
|
101 |
+
"hm": 32227,
|
102 |
+
"hng": 32228,
|
103 |
+
"hong": 32229,
|
104 |
+
"hou": 32230,
|
105 |
+
"hua": 32231,
|
106 |
+
"huai": 32232,
|
107 |
+
"huan": 32233,
|
108 |
+
"huang": 32234,
|
109 |
+
"hui": 32235,
|
110 |
+
"hun": 32236,
|
111 |
+
"huo": 32237,
|
112 |
+
"jia": 32238,
|
113 |
+
"jian": 32239,
|
114 |
+
"jiang": 32240,
|
115 |
+
"jiao": 32241,
|
116 |
+
"jie": 32242,
|
117 |
+
"jin": 32243,
|
118 |
+
"jing": 32244,
|
119 |
+
"jiong": 32245,
|
120 |
+
"jiu": 32246,
|
121 |
+
"ju": 32247,
|
122 |
+
"juan": 32248,
|
123 |
+
"jue": 32249,
|
124 |
+
"jun": 32250,
|
125 |
+
"kai": 32251,
|
126 |
+
"kan": 32252,
|
127 |
+
"kang": 32253,
|
128 |
+
"kao": 32254,
|
129 |
+
"kei": 32255,
|
130 |
+
"ken": 32256,
|
131 |
+
"keng": 32257,
|
132 |
+
"kong": 32258,
|
133 |
+
"kou": 32259,
|
134 |
+
"ku": 32260,
|
135 |
+
"kua": 32261,
|
136 |
+
"kuai": 32262,
|
137 |
+
"kuan": 32263,
|
138 |
+
"kuang": 32264,
|
139 |
+
"kui": 32265,
|
140 |
+
"kun": 32266,
|
141 |
+
"kuo": 32267,
|
142 |
+
"lai": 32268,
|
143 |
+
"lang": 32269,
|
144 |
+
"lao": 32270,
|
145 |
+
"lei": 32271,
|
146 |
+
"len": 32272,
|
147 |
+
"leng": 32273,
|
148 |
+
"lia": 32274,
|
149 |
+
"lian": 32275,
|
150 |
+
"liang": 32276,
|
151 |
+
"liao": 32277,
|
152 |
+
"lie": 32278,
|
153 |
+
"ling": 32279,
|
154 |
+
"liu": 32280,
|
155 |
+
"long": 32281,
|
156 |
+
"lou": 32282,
|
157 |
+
"lu": 32283,
|
158 |
+
"luan": 32284,
|
159 |
+
"lun": 32285,
|
160 |
+
"luo": 32286,
|
161 |
+
"lv": 32287,
|
162 |
+
"lve": 32288,
|
163 |
+
"mai": 32289,
|
164 |
+
"mang": 32290,
|
165 |
+
"mao": 32291,
|
166 |
+
"mei": 32292,
|
167 |
+
"men": 32293,
|
168 |
+
"meng": 32294,
|
169 |
+
"mian": 32295,
|
170 |
+
"miao": 32296,
|
171 |
+
"mie": 32297,
|
172 |
+
"ming": 32298,
|
173 |
+
"miu": 32299,
|
174 |
+
"mou": 32300,
|
175 |
+
"mu": 32301,
|
176 |
+
"nai": 32302,
|
177 |
+
"nan": 32303,
|
178 |
+
"nang": 32304,
|
179 |
+
"nao": 32305,
|
180 |
+
"nei": 32306,
|
181 |
+
"nen": 32307,
|
182 |
+
"neng": 32308,
|
183 |
+
"nia": 32309,
|
184 |
+
"nian": 32310,
|
185 |
+
"niang": 32311,
|
186 |
+
"niao": 32312,
|
187 |
+
"nie": 32313,
|
188 |
+
"nin": 32314,
|
189 |
+
"ning": 32315,
|
190 |
+
"niu": 32316,
|
191 |
+
"nong": 32317,
|
192 |
+
"nou": 32318,
|
193 |
+
"nu": 32319,
|
194 |
+
"nuan": 32320,
|
195 |
+
"nun": 32321,
|
196 |
+
"nuo": 32322,
|
197 |
+
"nv": 32323,
|
198 |
+
"nve": 32324,
|
199 |
+
"pai": 32325,
|
200 |
+
"pan": 32326,
|
201 |
+
"pang": 32327,
|
202 |
+
"pao": 32328,
|
203 |
+
"pei": 32329,
|
204 |
+
"pen": 32330,
|
205 |
+
"peng": 32331,
|
206 |
+
"pian": 32332,
|
207 |
+
"piao": 32333,
|
208 |
+
"pie": 32334,
|
209 |
+
"pin": 32335,
|
210 |
+
"ping": 32336,
|
211 |
+
"pou": 32337,
|
212 |
+
"pu": 32338,
|
213 |
+
"qi": 32339,
|
214 |
+
"qia": 32340,
|
215 |
+
"qian": 32341,
|
216 |
+
"qiang": 32342,
|
217 |
+
"qiao": 32343,
|
218 |
+
"qie": 32344,
|
219 |
+
"qin": 32345,
|
220 |
+
"qing": 32346,
|
221 |
+
"qiong": 32347,
|
222 |
+
"qiu": 32348,
|
223 |
+
"qu": 32349,
|
224 |
+
"quan": 32350,
|
225 |
+
"que": 32351,
|
226 |
+
"qun": 32352,
|
227 |
+
"rang": 32353,
|
228 |
+
"rao": 32354,
|
229 |
+
"ren": 32355,
|
230 |
+
"reng": 32356,
|
231 |
+
"rong": 32357,
|
232 |
+
"rou": 32358,
|
233 |
+
"rua": 32359,
|
234 |
+
"ruan": 32360,
|
235 |
+
"rui": 32361,
|
236 |
+
"run": 32362,
|
237 |
+
"ruo": 32363,
|
238 |
+
"sai": 32364,
|
239 |
+
"san": 32365,
|
240 |
+
"sang": 32366,
|
241 |
+
"sao": 32367,
|
242 |
+
"sen": 32368,
|
243 |
+
"seng": 32369,
|
244 |
+
"sha": 32370,
|
245 |
+
"shai": 32371,
|
246 |
+
"shan": 32372,
|
247 |
+
"shang": 32373,
|
248 |
+
"shao": 32374,
|
249 |
+
"she": 32375,
|
250 |
+
"shei": 32376,
|
251 |
+
"shen": 32377,
|
252 |
+
"sheng": 32378,
|
253 |
+
"shou": 32379,
|
254 |
+
"shu": 32380,
|
255 |
+
"shua": 32381,
|
256 |
+
"shuai": 32382,
|
257 |
+
"shuan": 32383,
|
258 |
+
"shuang": 32384,
|
259 |
+
"shui": 32385,
|
260 |
+
"shun": 32386,
|
261 |
+
"shuo": 32387,
|
262 |
+
"song": 32388,
|
263 |
+
"sou": 32389,
|
264 |
+
"su": 32390,
|
265 |
+
"suan": 32391,
|
266 |
+
"sui": 32392,
|
267 |
+
"sun": 32393,
|
268 |
+
"suo": 32394,
|
269 |
+
"tai": 32395,
|
270 |
+
"tan": 32396,
|
271 |
+
"tang": 32397,
|
272 |
+
"tao": 32398,
|
273 |
+
"tei": 32399,
|
274 |
+
"teng": 32400,
|
275 |
+
"tian": 32401,
|
276 |
+
"tiao": 32402,
|
277 |
+
"tie": 32403,
|
278 |
+
"ting": 32404,
|
279 |
+
"tong": 32405,
|
280 |
+
"tou": 32406,
|
281 |
+
"tu": 32407,
|
282 |
+
"tuan": 32408,
|
283 |
+
"tui": 32409,
|
284 |
+
"tun": 32410,
|
285 |
+
"tuo": 32411,
|
286 |
+
"wa": 32412,
|
287 |
+
"wai": 32413,
|
288 |
+
"wan": 32414,
|
289 |
+
"wang": 32415,
|
290 |
+
"wei": 32416,
|
291 |
+
"wen": 32417,
|
292 |
+
"weng": 32418,
|
293 |
+
"wo": 32419,
|
294 |
+
"wong": 32420,
|
295 |
+
"wu": 32421,
|
296 |
+
"xi": 32422,
|
297 |
+
"xia": 32423,
|
298 |
+
"xian": 32424,
|
299 |
+
"xiang": 32425,
|
300 |
+
"xiao": 32426,
|
301 |
+
"xie": 32427,
|
302 |
+
"xin": 32428,
|
303 |
+
"xiong": 32429,
|
304 |
+
"xiu": 32430,
|
305 |
+
"xu": 32431,
|
306 |
+
"xuan": 32432,
|
307 |
+
"xue": 32433,
|
308 |
+
"xun": 32434,
|
309 |
+
"ya": 32435,
|
310 |
+
"yan": 32436,
|
311 |
+
"yang": 32437,
|
312 |
+
"yao": 32438,
|
313 |
+
"ye": 32439,
|
314 |
+
"yi": 32440,
|
315 |
+
"yin": 32441,
|
316 |
+
"ying": 32442,
|
317 |
+
"yong": 32443,
|
318 |
+
"you": 32444,
|
319 |
+
"yu": 32445,
|
320 |
+
"yuan": 32446,
|
321 |
+
"yue": 32447,
|
322 |
+
"yun": 32448,
|
323 |
+
"za": 32449,
|
324 |
+
"zai": 32450,
|
325 |
+
"zan": 32451,
|
326 |
+
"zang": 32452,
|
327 |
+
"zao": 32453,
|
328 |
+
"ze": 32454,
|
329 |
+
"zei": 32455,
|
330 |
+
"zen": 32456,
|
331 |
+
"zeng": 32457,
|
332 |
+
"zha": 32458,
|
333 |
+
"zhai": 32459,
|
334 |
+
"zhan": 32460,
|
335 |
+
"zhang": 32461,
|
336 |
+
"zhao": 32462,
|
337 |
+
"zhe": 32463,
|
338 |
+
"zhei": 32464,
|
339 |
+
"zhen": 32465,
|
340 |
+
"zheng": 32466,
|
341 |
+
"zhi": 32467,
|
342 |
+
"zhong": 32468,
|
343 |
+
"zhou": 32469,
|
344 |
+
"zhu": 32470,
|
345 |
+
"zhua": 32471,
|
346 |
+
"zhuai": 32472,
|
347 |
+
"zhuan": 32473,
|
348 |
+
"zhuang": 32474,
|
349 |
+
"zhui": 32475,
|
350 |
+
"zhun": 32476,
|
351 |
+
"zhuo": 32477,
|
352 |
+
"zi": 32478,
|
353 |
+
"zong": 32479,
|
354 |
+
"zou": 32480,
|
355 |
+
"zu": 32481,
|
356 |
+
"zuan": 32482,
|
357 |
+
"zui": 32483,
|
358 |
+
"zun": 32484,
|
359 |
+
"zuo": 32485
|
360 |
+
}
|
config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Langboat/mengzi-t5-base",
|
3 |
+
"architectures": [
|
4 |
+
"T5ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"d_ff": 2048,
|
7 |
+
"d_kv": 64,
|
8 |
+
"d_model": 768,
|
9 |
+
"decoder_start_token_id": 0,
|
10 |
+
"dense_act_fn": "gelu_new",
|
11 |
+
"dropout_rate": 0.1,
|
12 |
+
"eos_token_id": 1,
|
13 |
+
"feed_forward_proj": "gated-gelu",
|
14 |
+
"gradient_checkpointing": false,
|
15 |
+
"initializer_factor": 1.0,
|
16 |
+
"is_encoder_decoder": true,
|
17 |
+
"is_gated_act": true,
|
18 |
+
"layer_norm_epsilon": 1e-06,
|
19 |
+
"max_length": 128,
|
20 |
+
"model_type": "t5",
|
21 |
+
"num_decoder_layers": 12,
|
22 |
+
"num_heads": 12,
|
23 |
+
"num_layers": 12,
|
24 |
+
"output_past": true,
|
25 |
+
"pad_token_id": 0,
|
26 |
+
"relative_attention_max_distance": 128,
|
27 |
+
"relative_attention_num_buckets": 32,
|
28 |
+
"tie_word_embeddings": false,
|
29 |
+
"torch_dtype": "float32",
|
30 |
+
"transformers_version": "4.21.0",
|
31 |
+
"use_cache": true,
|
32 |
+
"vocab_size": 32486
|
33 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caaa6b46a4a3be786b1bb57af3e06a66298bcb57923643b683b9a9b2ab762253
|
3 |
+
size 992608437
|
special_tokens_map.json
ADDED
@@ -0,0 +1,107 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
"<extra_id_0>",
|
4 |
+
"<extra_id_1>",
|
5 |
+
"<extra_id_2>",
|
6 |
+
"<extra_id_3>",
|
7 |
+
"<extra_id_4>",
|
8 |
+
"<extra_id_5>",
|
9 |
+
"<extra_id_6>",
|
10 |
+
"<extra_id_7>",
|
11 |
+
"<extra_id_8>",
|
12 |
+
"<extra_id_9>",
|
13 |
+
"<extra_id_10>",
|
14 |
+
"<extra_id_11>",
|
15 |
+
"<extra_id_12>",
|
16 |
+
"<extra_id_13>",
|
17 |
+
"<extra_id_14>",
|
18 |
+
"<extra_id_15>",
|
19 |
+
"<extra_id_16>",
|
20 |
+
"<extra_id_17>",
|
21 |
+
"<extra_id_18>",
|
22 |
+
"<extra_id_19>",
|
23 |
+
"<extra_id_20>",
|
24 |
+
"<extra_id_21>",
|
25 |
+
"<extra_id_22>",
|
26 |
+
"<extra_id_23>",
|
27 |
+
"<extra_id_24>",
|
28 |
+
"<extra_id_25>",
|
29 |
+
"<extra_id_26>",
|
30 |
+
"<extra_id_27>",
|
31 |
+
"<extra_id_28>",
|
32 |
+
"<extra_id_29>",
|
33 |
+
"<extra_id_30>",
|
34 |
+
"<extra_id_31>",
|
35 |
+
"<extra_id_32>",
|
36 |
+
"<extra_id_33>",
|
37 |
+
"<extra_id_34>",
|
38 |
+
"<extra_id_35>",
|
39 |
+
"<extra_id_36>",
|
40 |
+
"<extra_id_37>",
|
41 |
+
"<extra_id_38>",
|
42 |
+
"<extra_id_39>",
|
43 |
+
"<extra_id_40>",
|
44 |
+
"<extra_id_41>",
|
45 |
+
"<extra_id_42>",
|
46 |
+
"<extra_id_43>",
|
47 |
+
"<extra_id_44>",
|
48 |
+
"<extra_id_45>",
|
49 |
+
"<extra_id_46>",
|
50 |
+
"<extra_id_47>",
|
51 |
+
"<extra_id_48>",
|
52 |
+
"<extra_id_49>",
|
53 |
+
"<extra_id_50>",
|
54 |
+
"<extra_id_51>",
|
55 |
+
"<extra_id_52>",
|
56 |
+
"<extra_id_53>",
|
57 |
+
"<extra_id_54>",
|
58 |
+
"<extra_id_55>",
|
59 |
+
"<extra_id_56>",
|
60 |
+
"<extra_id_57>",
|
61 |
+
"<extra_id_58>",
|
62 |
+
"<extra_id_59>",
|
63 |
+
"<extra_id_60>",
|
64 |
+
"<extra_id_61>",
|
65 |
+
"<extra_id_62>",
|
66 |
+
"<extra_id_63>",
|
67 |
+
"<extra_id_64>",
|
68 |
+
"<extra_id_65>",
|
69 |
+
"<extra_id_66>",
|
70 |
+
"<extra_id_67>",
|
71 |
+
"<extra_id_68>",
|
72 |
+
"<extra_id_69>",
|
73 |
+
"<extra_id_70>",
|
74 |
+
"<extra_id_71>",
|
75 |
+
"<extra_id_72>",
|
76 |
+
"<extra_id_73>",
|
77 |
+
"<extra_id_74>",
|
78 |
+
"<extra_id_75>",
|
79 |
+
"<extra_id_76>",
|
80 |
+
"<extra_id_77>",
|
81 |
+
"<extra_id_78>",
|
82 |
+
"<extra_id_79>",
|
83 |
+
"<extra_id_80>",
|
84 |
+
"<extra_id_81>",
|
85 |
+
"<extra_id_82>",
|
86 |
+
"<extra_id_83>",
|
87 |
+
"<extra_id_84>",
|
88 |
+
"<extra_id_85>",
|
89 |
+
"<extra_id_86>",
|
90 |
+
"<extra_id_87>",
|
91 |
+
"<extra_id_88>",
|
92 |
+
"<extra_id_89>",
|
93 |
+
"<extra_id_90>",
|
94 |
+
"<extra_id_91>",
|
95 |
+
"<extra_id_92>",
|
96 |
+
"<extra_id_93>",
|
97 |
+
"<extra_id_94>",
|
98 |
+
"<extra_id_95>",
|
99 |
+
"<extra_id_96>",
|
100 |
+
"<extra_id_97>",
|
101 |
+
"<extra_id_98>",
|
102 |
+
"<extra_id_99>"
|
103 |
+
],
|
104 |
+
"eos_token": "</s>",
|
105 |
+
"pad_token": "<pad>",
|
106 |
+
"unk_token": "<unk>"
|
107 |
+
}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0dc796e4a3d83ccbeb33b35ce905c5821b427f19343e1bdad7d0b47a3317cac
|
3 |
+
size 725135
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
"<extra_id_0>",
|
4 |
+
"<extra_id_1>",
|
5 |
+
"<extra_id_2>",
|
6 |
+
"<extra_id_3>",
|
7 |
+
"<extra_id_4>",
|
8 |
+
"<extra_id_5>",
|
9 |
+
"<extra_id_6>",
|
10 |
+
"<extra_id_7>",
|
11 |
+
"<extra_id_8>",
|
12 |
+
"<extra_id_9>",
|
13 |
+
"<extra_id_10>",
|
14 |
+
"<extra_id_11>",
|
15 |
+
"<extra_id_12>",
|
16 |
+
"<extra_id_13>",
|
17 |
+
"<extra_id_14>",
|
18 |
+
"<extra_id_15>",
|
19 |
+
"<extra_id_16>",
|
20 |
+
"<extra_id_17>",
|
21 |
+
"<extra_id_18>",
|
22 |
+
"<extra_id_19>",
|
23 |
+
"<extra_id_20>",
|
24 |
+
"<extra_id_21>",
|
25 |
+
"<extra_id_22>",
|
26 |
+
"<extra_id_23>",
|
27 |
+
"<extra_id_24>",
|
28 |
+
"<extra_id_25>",
|
29 |
+
"<extra_id_26>",
|
30 |
+
"<extra_id_27>",
|
31 |
+
"<extra_id_28>",
|
32 |
+
"<extra_id_29>",
|
33 |
+
"<extra_id_30>",
|
34 |
+
"<extra_id_31>",
|
35 |
+
"<extra_id_32>",
|
36 |
+
"<extra_id_33>",
|
37 |
+
"<extra_id_34>",
|
38 |
+
"<extra_id_35>",
|
39 |
+
"<extra_id_36>",
|
40 |
+
"<extra_id_37>",
|
41 |
+
"<extra_id_38>",
|
42 |
+
"<extra_id_39>",
|
43 |
+
"<extra_id_40>",
|
44 |
+
"<extra_id_41>",
|
45 |
+
"<extra_id_42>",
|
46 |
+
"<extra_id_43>",
|
47 |
+
"<extra_id_44>",
|
48 |
+
"<extra_id_45>",
|
49 |
+
"<extra_id_46>",
|
50 |
+
"<extra_id_47>",
|
51 |
+
"<extra_id_48>",
|
52 |
+
"<extra_id_49>",
|
53 |
+
"<extra_id_50>",
|
54 |
+
"<extra_id_51>",
|
55 |
+
"<extra_id_52>",
|
56 |
+
"<extra_id_53>",
|
57 |
+
"<extra_id_54>",
|
58 |
+
"<extra_id_55>",
|
59 |
+
"<extra_id_56>",
|
60 |
+
"<extra_id_57>",
|
61 |
+
"<extra_id_58>",
|
62 |
+
"<extra_id_59>",
|
63 |
+
"<extra_id_60>",
|
64 |
+
"<extra_id_61>",
|
65 |
+
"<extra_id_62>",
|
66 |
+
"<extra_id_63>",
|
67 |
+
"<extra_id_64>",
|
68 |
+
"<extra_id_65>",
|
69 |
+
"<extra_id_66>",
|
70 |
+
"<extra_id_67>",
|
71 |
+
"<extra_id_68>",
|
72 |
+
"<extra_id_69>",
|
73 |
+
"<extra_id_70>",
|
74 |
+
"<extra_id_71>",
|
75 |
+
"<extra_id_72>",
|
76 |
+
"<extra_id_73>",
|
77 |
+
"<extra_id_74>",
|
78 |
+
"<extra_id_75>",
|
79 |
+
"<extra_id_76>",
|
80 |
+
"<extra_id_77>",
|
81 |
+
"<extra_id_78>",
|
82 |
+
"<extra_id_79>",
|
83 |
+
"<extra_id_80>",
|
84 |
+
"<extra_id_81>",
|
85 |
+
"<extra_id_82>",
|
86 |
+
"<extra_id_83>",
|
87 |
+
"<extra_id_84>",
|
88 |
+
"<extra_id_85>",
|
89 |
+
"<extra_id_86>",
|
90 |
+
"<extra_id_87>",
|
91 |
+
"<extra_id_88>",
|
92 |
+
"<extra_id_89>",
|
93 |
+
"<extra_id_90>",
|
94 |
+
"<extra_id_91>",
|
95 |
+
"<extra_id_92>",
|
96 |
+
"<extra_id_93>",
|
97 |
+
"<extra_id_94>",
|
98 |
+
"<extra_id_95>",
|
99 |
+
"<extra_id_96>",
|
100 |
+
"<extra_id_97>",
|
101 |
+
"<extra_id_98>",
|
102 |
+
"<extra_id_99>"
|
103 |
+
],
|
104 |
+
"eos_token": "</s>",
|
105 |
+
"extra_ids": 100,
|
106 |
+
"max_length": 128,
|
107 |
+
"name_or_path": "Langboat/mengzi-t5-base",
|
108 |
+
"pad_token": "<pad>",
|
109 |
+
"sp_model_kwargs": {},
|
110 |
+
"special_tokens_map_file": null,
|
111 |
+
"tokenizer_class": "T5Tokenizer",
|
112 |
+
"unk_token": "<unk>"
|
113 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bd43763a40e4f1c3fb579686bff7a455a7e01737828274cb97628dc57ded406
|
3 |
+
size 3387
|