EddieChen372 commited on
Commit
56d026e
1 Parent(s): 43dfc3b

Training in progress epoch 5

Browse files
added_tokens.json ADDED
@@ -0,0 +1,502 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "CLASS_0": 32500,
3
+ "CLASS_1": 32501,
4
+ "CLASS_10": 32510,
5
+ "CLASS_11": 32511,
6
+ "CLASS_12": 32512,
7
+ "CLASS_13": 32513,
8
+ "CLASS_14": 32514,
9
+ "CLASS_15": 32515,
10
+ "CLASS_16": 32516,
11
+ "CLASS_17": 32517,
12
+ "CLASS_18": 32518,
13
+ "CLASS_19": 32519,
14
+ "CLASS_2": 32502,
15
+ "CLASS_20": 32520,
16
+ "CLASS_21": 32521,
17
+ "CLASS_22": 32522,
18
+ "CLASS_23": 32523,
19
+ "CLASS_24": 32524,
20
+ "CLASS_25": 32525,
21
+ "CLASS_26": 32526,
22
+ "CLASS_27": 32527,
23
+ "CLASS_28": 32528,
24
+ "CLASS_29": 32529,
25
+ "CLASS_3": 32503,
26
+ "CLASS_30": 32530,
27
+ "CLASS_31": 32531,
28
+ "CLASS_32": 32532,
29
+ "CLASS_33": 32533,
30
+ "CLASS_34": 32534,
31
+ "CLASS_35": 32535,
32
+ "CLASS_36": 32536,
33
+ "CLASS_37": 32537,
34
+ "CLASS_38": 32538,
35
+ "CLASS_39": 32539,
36
+ "CLASS_4": 32504,
37
+ "CLASS_40": 32540,
38
+ "CLASS_41": 32541,
39
+ "CLASS_42": 32542,
40
+ "CLASS_43": 32543,
41
+ "CLASS_44": 32544,
42
+ "CLASS_45": 32545,
43
+ "CLASS_46": 32546,
44
+ "CLASS_47": 32547,
45
+ "CLASS_48": 32548,
46
+ "CLASS_49": 32549,
47
+ "CLASS_5": 32505,
48
+ "CLASS_50": 32550,
49
+ "CLASS_51": 32551,
50
+ "CLASS_52": 32552,
51
+ "CLASS_53": 32553,
52
+ "CLASS_54": 32554,
53
+ "CLASS_55": 32555,
54
+ "CLASS_56": 32556,
55
+ "CLASS_57": 32557,
56
+ "CLASS_58": 32558,
57
+ "CLASS_59": 32559,
58
+ "CLASS_6": 32506,
59
+ "CLASS_60": 32560,
60
+ "CLASS_61": 32561,
61
+ "CLASS_62": 32562,
62
+ "CLASS_63": 32563,
63
+ "CLASS_64": 32564,
64
+ "CLASS_65": 32565,
65
+ "CLASS_66": 32566,
66
+ "CLASS_67": 32567,
67
+ "CLASS_68": 32568,
68
+ "CLASS_69": 32569,
69
+ "CLASS_7": 32507,
70
+ "CLASS_70": 32570,
71
+ "CLASS_71": 32571,
72
+ "CLASS_72": 32572,
73
+ "CLASS_73": 32573,
74
+ "CLASS_74": 32574,
75
+ "CLASS_75": 32575,
76
+ "CLASS_76": 32576,
77
+ "CLASS_77": 32577,
78
+ "CLASS_78": 32578,
79
+ "CLASS_79": 32579,
80
+ "CLASS_8": 32508,
81
+ "CLASS_80": 32580,
82
+ "CLASS_81": 32581,
83
+ "CLASS_82": 32582,
84
+ "CLASS_83": 32583,
85
+ "CLASS_84": 32584,
86
+ "CLASS_85": 32585,
87
+ "CLASS_86": 32586,
88
+ "CLASS_87": 32587,
89
+ "CLASS_88": 32588,
90
+ "CLASS_89": 32589,
91
+ "CLASS_9": 32509,
92
+ "CLASS_90": 32590,
93
+ "CLASS_91": 32591,
94
+ "CLASS_92": 32592,
95
+ "CLASS_93": 32593,
96
+ "CLASS_94": 32594,
97
+ "CLASS_95": 32595,
98
+ "CLASS_96": 32596,
99
+ "CLASS_97": 32597,
100
+ "CLASS_98": 32598,
101
+ "CLASS_99": 32599,
102
+ "FUNC_0": 32400,
103
+ "FUNC_1": 32401,
104
+ "FUNC_10": 32410,
105
+ "FUNC_11": 32411,
106
+ "FUNC_12": 32412,
107
+ "FUNC_13": 32413,
108
+ "FUNC_14": 32414,
109
+ "FUNC_15": 32415,
110
+ "FUNC_16": 32416,
111
+ "FUNC_17": 32417,
112
+ "FUNC_18": 32418,
113
+ "FUNC_19": 32419,
114
+ "FUNC_2": 32402,
115
+ "FUNC_20": 32420,
116
+ "FUNC_21": 32421,
117
+ "FUNC_22": 32422,
118
+ "FUNC_23": 32423,
119
+ "FUNC_24": 32424,
120
+ "FUNC_25": 32425,
121
+ "FUNC_26": 32426,
122
+ "FUNC_27": 32427,
123
+ "FUNC_28": 32428,
124
+ "FUNC_29": 32429,
125
+ "FUNC_3": 32403,
126
+ "FUNC_30": 32430,
127
+ "FUNC_31": 32431,
128
+ "FUNC_32": 32432,
129
+ "FUNC_33": 32433,
130
+ "FUNC_34": 32434,
131
+ "FUNC_35": 32435,
132
+ "FUNC_36": 32436,
133
+ "FUNC_37": 32437,
134
+ "FUNC_38": 32438,
135
+ "FUNC_39": 32439,
136
+ "FUNC_4": 32404,
137
+ "FUNC_40": 32440,
138
+ "FUNC_41": 32441,
139
+ "FUNC_42": 32442,
140
+ "FUNC_43": 32443,
141
+ "FUNC_44": 32444,
142
+ "FUNC_45": 32445,
143
+ "FUNC_46": 32446,
144
+ "FUNC_47": 32447,
145
+ "FUNC_48": 32448,
146
+ "FUNC_49": 32449,
147
+ "FUNC_5": 32405,
148
+ "FUNC_50": 32450,
149
+ "FUNC_51": 32451,
150
+ "FUNC_52": 32452,
151
+ "FUNC_53": 32453,
152
+ "FUNC_54": 32454,
153
+ "FUNC_55": 32455,
154
+ "FUNC_56": 32456,
155
+ "FUNC_57": 32457,
156
+ "FUNC_58": 32458,
157
+ "FUNC_59": 32459,
158
+ "FUNC_6": 32406,
159
+ "FUNC_60": 32460,
160
+ "FUNC_61": 32461,
161
+ "FUNC_62": 32462,
162
+ "FUNC_63": 32463,
163
+ "FUNC_64": 32464,
164
+ "FUNC_65": 32465,
165
+ "FUNC_66": 32466,
166
+ "FUNC_67": 32467,
167
+ "FUNC_68": 32468,
168
+ "FUNC_69": 32469,
169
+ "FUNC_7": 32407,
170
+ "FUNC_70": 32470,
171
+ "FUNC_71": 32471,
172
+ "FUNC_72": 32472,
173
+ "FUNC_73": 32473,
174
+ "FUNC_74": 32474,
175
+ "FUNC_75": 32475,
176
+ "FUNC_76": 32476,
177
+ "FUNC_77": 32477,
178
+ "FUNC_78": 32478,
179
+ "FUNC_79": 32479,
180
+ "FUNC_8": 32408,
181
+ "FUNC_80": 32480,
182
+ "FUNC_81": 32481,
183
+ "FUNC_82": 32482,
184
+ "FUNC_83": 32483,
185
+ "FUNC_84": 32484,
186
+ "FUNC_85": 32485,
187
+ "FUNC_86": 32486,
188
+ "FUNC_87": 32487,
189
+ "FUNC_88": 32488,
190
+ "FUNC_89": 32489,
191
+ "FUNC_9": 32409,
192
+ "FUNC_90": 32490,
193
+ "FUNC_91": 32491,
194
+ "FUNC_92": 32492,
195
+ "FUNC_93": 32493,
196
+ "FUNC_94": 32494,
197
+ "FUNC_95": 32495,
198
+ "FUNC_96": 32496,
199
+ "FUNC_97": 32497,
200
+ "FUNC_98": 32498,
201
+ "FUNC_99": 32499,
202
+ "VAR_0": 32100,
203
+ "VAR_1": 32101,
204
+ "VAR_10": 32110,
205
+ "VAR_100": 32200,
206
+ "VAR_101": 32201,
207
+ "VAR_102": 32202,
208
+ "VAR_103": 32203,
209
+ "VAR_104": 32204,
210
+ "VAR_105": 32205,
211
+ "VAR_106": 32206,
212
+ "VAR_107": 32207,
213
+ "VAR_108": 32208,
214
+ "VAR_109": 32209,
215
+ "VAR_11": 32111,
216
+ "VAR_110": 32210,
217
+ "VAR_111": 32211,
218
+ "VAR_112": 32212,
219
+ "VAR_113": 32213,
220
+ "VAR_114": 32214,
221
+ "VAR_115": 32215,
222
+ "VAR_116": 32216,
223
+ "VAR_117": 32217,
224
+ "VAR_118": 32218,
225
+ "VAR_119": 32219,
226
+ "VAR_12": 32112,
227
+ "VAR_120": 32220,
228
+ "VAR_121": 32221,
229
+ "VAR_122": 32222,
230
+ "VAR_123": 32223,
231
+ "VAR_124": 32224,
232
+ "VAR_125": 32225,
233
+ "VAR_126": 32226,
234
+ "VAR_127": 32227,
235
+ "VAR_128": 32228,
236
+ "VAR_129": 32229,
237
+ "VAR_13": 32113,
238
+ "VAR_130": 32230,
239
+ "VAR_131": 32231,
240
+ "VAR_132": 32232,
241
+ "VAR_133": 32233,
242
+ "VAR_134": 32234,
243
+ "VAR_135": 32235,
244
+ "VAR_136": 32236,
245
+ "VAR_137": 32237,
246
+ "VAR_138": 32238,
247
+ "VAR_139": 32239,
248
+ "VAR_14": 32114,
249
+ "VAR_140": 32240,
250
+ "VAR_141": 32241,
251
+ "VAR_142": 32242,
252
+ "VAR_143": 32243,
253
+ "VAR_144": 32244,
254
+ "VAR_145": 32245,
255
+ "VAR_146": 32246,
256
+ "VAR_147": 32247,
257
+ "VAR_148": 32248,
258
+ "VAR_149": 32249,
259
+ "VAR_15": 32115,
260
+ "VAR_150": 32250,
261
+ "VAR_151": 32251,
262
+ "VAR_152": 32252,
263
+ "VAR_153": 32253,
264
+ "VAR_154": 32254,
265
+ "VAR_155": 32255,
266
+ "VAR_156": 32256,
267
+ "VAR_157": 32257,
268
+ "VAR_158": 32258,
269
+ "VAR_159": 32259,
270
+ "VAR_16": 32116,
271
+ "VAR_160": 32260,
272
+ "VAR_161": 32261,
273
+ "VAR_162": 32262,
274
+ "VAR_163": 32263,
275
+ "VAR_164": 32264,
276
+ "VAR_165": 32265,
277
+ "VAR_166": 32266,
278
+ "VAR_167": 32267,
279
+ "VAR_168": 32268,
280
+ "VAR_169": 32269,
281
+ "VAR_17": 32117,
282
+ "VAR_170": 32270,
283
+ "VAR_171": 32271,
284
+ "VAR_172": 32272,
285
+ "VAR_173": 32273,
286
+ "VAR_174": 32274,
287
+ "VAR_175": 32275,
288
+ "VAR_176": 32276,
289
+ "VAR_177": 32277,
290
+ "VAR_178": 32278,
291
+ "VAR_179": 32279,
292
+ "VAR_18": 32118,
293
+ "VAR_180": 32280,
294
+ "VAR_181": 32281,
295
+ "VAR_182": 32282,
296
+ "VAR_183": 32283,
297
+ "VAR_184": 32284,
298
+ "VAR_185": 32285,
299
+ "VAR_186": 32286,
300
+ "VAR_187": 32287,
301
+ "VAR_188": 32288,
302
+ "VAR_189": 32289,
303
+ "VAR_19": 32119,
304
+ "VAR_190": 32290,
305
+ "VAR_191": 32291,
306
+ "VAR_192": 32292,
307
+ "VAR_193": 32293,
308
+ "VAR_194": 32294,
309
+ "VAR_195": 32295,
310
+ "VAR_196": 32296,
311
+ "VAR_197": 32297,
312
+ "VAR_198": 32298,
313
+ "VAR_199": 32299,
314
+ "VAR_2": 32102,
315
+ "VAR_20": 32120,
316
+ "VAR_200": 32300,
317
+ "VAR_201": 32301,
318
+ "VAR_202": 32302,
319
+ "VAR_203": 32303,
320
+ "VAR_204": 32304,
321
+ "VAR_205": 32305,
322
+ "VAR_206": 32306,
323
+ "VAR_207": 32307,
324
+ "VAR_208": 32308,
325
+ "VAR_209": 32309,
326
+ "VAR_21": 32121,
327
+ "VAR_210": 32310,
328
+ "VAR_211": 32311,
329
+ "VAR_212": 32312,
330
+ "VAR_213": 32313,
331
+ "VAR_214": 32314,
332
+ "VAR_215": 32315,
333
+ "VAR_216": 32316,
334
+ "VAR_217": 32317,
335
+ "VAR_218": 32318,
336
+ "VAR_219": 32319,
337
+ "VAR_22": 32122,
338
+ "VAR_220": 32320,
339
+ "VAR_221": 32321,
340
+ "VAR_222": 32322,
341
+ "VAR_223": 32323,
342
+ "VAR_224": 32324,
343
+ "VAR_225": 32325,
344
+ "VAR_226": 32326,
345
+ "VAR_227": 32327,
346
+ "VAR_228": 32328,
347
+ "VAR_229": 32329,
348
+ "VAR_23": 32123,
349
+ "VAR_230": 32330,
350
+ "VAR_231": 32331,
351
+ "VAR_232": 32332,
352
+ "VAR_233": 32333,
353
+ "VAR_234": 32334,
354
+ "VAR_235": 32335,
355
+ "VAR_236": 32336,
356
+ "VAR_237": 32337,
357
+ "VAR_238": 32338,
358
+ "VAR_239": 32339,
359
+ "VAR_24": 32124,
360
+ "VAR_240": 32340,
361
+ "VAR_241": 32341,
362
+ "VAR_242": 32342,
363
+ "VAR_243": 32343,
364
+ "VAR_244": 32344,
365
+ "VAR_245": 32345,
366
+ "VAR_246": 32346,
367
+ "VAR_247": 32347,
368
+ "VAR_248": 32348,
369
+ "VAR_249": 32349,
370
+ "VAR_25": 32125,
371
+ "VAR_250": 32350,
372
+ "VAR_251": 32351,
373
+ "VAR_252": 32352,
374
+ "VAR_253": 32353,
375
+ "VAR_254": 32354,
376
+ "VAR_255": 32355,
377
+ "VAR_256": 32356,
378
+ "VAR_257": 32357,
379
+ "VAR_258": 32358,
380
+ "VAR_259": 32359,
381
+ "VAR_26": 32126,
382
+ "VAR_260": 32360,
383
+ "VAR_261": 32361,
384
+ "VAR_262": 32362,
385
+ "VAR_263": 32363,
386
+ "VAR_264": 32364,
387
+ "VAR_265": 32365,
388
+ "VAR_266": 32366,
389
+ "VAR_267": 32367,
390
+ "VAR_268": 32368,
391
+ "VAR_269": 32369,
392
+ "VAR_27": 32127,
393
+ "VAR_270": 32370,
394
+ "VAR_271": 32371,
395
+ "VAR_272": 32372,
396
+ "VAR_273": 32373,
397
+ "VAR_274": 32374,
398
+ "VAR_275": 32375,
399
+ "VAR_276": 32376,
400
+ "VAR_277": 32377,
401
+ "VAR_278": 32378,
402
+ "VAR_279": 32379,
403
+ "VAR_28": 32128,
404
+ "VAR_280": 32380,
405
+ "VAR_281": 32381,
406
+ "VAR_282": 32382,
407
+ "VAR_283": 32383,
408
+ "VAR_284": 32384,
409
+ "VAR_285": 32385,
410
+ "VAR_286": 32386,
411
+ "VAR_287": 32387,
412
+ "VAR_288": 32388,
413
+ "VAR_289": 32389,
414
+ "VAR_29": 32129,
415
+ "VAR_290": 32390,
416
+ "VAR_291": 32391,
417
+ "VAR_292": 32392,
418
+ "VAR_293": 32393,
419
+ "VAR_294": 32394,
420
+ "VAR_295": 32395,
421
+ "VAR_296": 32396,
422
+ "VAR_297": 32397,
423
+ "VAR_298": 32398,
424
+ "VAR_299": 32399,
425
+ "VAR_3": 32103,
426
+ "VAR_30": 32130,
427
+ "VAR_31": 32131,
428
+ "VAR_32": 32132,
429
+ "VAR_33": 32133,
430
+ "VAR_34": 32134,
431
+ "VAR_35": 32135,
432
+ "VAR_36": 32136,
433
+ "VAR_37": 32137,
434
+ "VAR_38": 32138,
435
+ "VAR_39": 32139,
436
+ "VAR_4": 32104,
437
+ "VAR_40": 32140,
438
+ "VAR_41": 32141,
439
+ "VAR_42": 32142,
440
+ "VAR_43": 32143,
441
+ "VAR_44": 32144,
442
+ "VAR_45": 32145,
443
+ "VAR_46": 32146,
444
+ "VAR_47": 32147,
445
+ "VAR_48": 32148,
446
+ "VAR_49": 32149,
447
+ "VAR_5": 32105,
448
+ "VAR_50": 32150,
449
+ "VAR_51": 32151,
450
+ "VAR_52": 32152,
451
+ "VAR_53": 32153,
452
+ "VAR_54": 32154,
453
+ "VAR_55": 32155,
454
+ "VAR_56": 32156,
455
+ "VAR_57": 32157,
456
+ "VAR_58": 32158,
457
+ "VAR_59": 32159,
458
+ "VAR_6": 32106,
459
+ "VAR_60": 32160,
460
+ "VAR_61": 32161,
461
+ "VAR_62": 32162,
462
+ "VAR_63": 32163,
463
+ "VAR_64": 32164,
464
+ "VAR_65": 32165,
465
+ "VAR_66": 32166,
466
+ "VAR_67": 32167,
467
+ "VAR_68": 32168,
468
+ "VAR_69": 32169,
469
+ "VAR_7": 32107,
470
+ "VAR_70": 32170,
471
+ "VAR_71": 32171,
472
+ "VAR_72": 32172,
473
+ "VAR_73": 32173,
474
+ "VAR_74": 32174,
475
+ "VAR_75": 32175,
476
+ "VAR_76": 32176,
477
+ "VAR_77": 32177,
478
+ "VAR_78": 32178,
479
+ "VAR_79": 32179,
480
+ "VAR_8": 32108,
481
+ "VAR_80": 32180,
482
+ "VAR_81": 32181,
483
+ "VAR_82": 32182,
484
+ "VAR_83": 32183,
485
+ "VAR_84": 32184,
486
+ "VAR_85": 32185,
487
+ "VAR_86": 32186,
488
+ "VAR_87": 32187,
489
+ "VAR_88": 32188,
490
+ "VAR_89": 32189,
491
+ "VAR_9": 32109,
492
+ "VAR_90": 32190,
493
+ "VAR_91": 32191,
494
+ "VAR_92": 32192,
495
+ "VAR_93": 32193,
496
+ "VAR_94": 32194,
497
+ "VAR_95": 32195,
498
+ "VAR_96": 32196,
499
+ "VAR_97": 32197,
500
+ "VAR_98": 32198,
501
+ "VAR_99": 32199
502
+ }
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Salesforce/codet5-small",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "bos_token_id": 1,
7
+ "d_ff": 2048,
8
+ "d_kv": 64,
9
+ "d_model": 512,
10
+ "decoder_start_token_id": 0,
11
+ "dense_act_fn": "relu",
12
+ "dropout_rate": 0.1,
13
+ "eos_token_id": 2,
14
+ "feed_forward_proj": "relu",
15
+ "gradient_checkpointing": false,
16
+ "id2label": {
17
+ "0": "LABEL_0"
18
+ },
19
+ "initializer_factor": 1.0,
20
+ "is_encoder_decoder": true,
21
+ "is_gated_act": false,
22
+ "label2id": {
23
+ "LABEL_0": 0
24
+ },
25
+ "layer_norm_epsilon": 1e-06,
26
+ "model_type": "t5",
27
+ "n_positions": 512,
28
+ "num_decoder_layers": 6,
29
+ "num_heads": 8,
30
+ "num_layers": 6,
31
+ "output_past": true,
32
+ "pad_token_id": 0,
33
+ "relative_attention_max_distance": 128,
34
+ "relative_attention_num_buckets": 32,
35
+ "task_specific_params": {
36
+ "summarization": {
37
+ "early_stopping": true,
38
+ "length_penalty": 2.0,
39
+ "max_length": 200,
40
+ "min_length": 30,
41
+ "no_repeat_ngram_size": 3,
42
+ "num_beams": 4,
43
+ "prefix": "summarize: "
44
+ },
45
+ "translation_en_to_de": {
46
+ "early_stopping": true,
47
+ "max_length": 300,
48
+ "num_beams": 4,
49
+ "prefix": "translate English to German: "
50
+ },
51
+ "translation_en_to_fr": {
52
+ "early_stopping": true,
53
+ "max_length": 300,
54
+ "num_beams": 4,
55
+ "prefix": "translate English to French: "
56
+ },
57
+ "translation_en_to_ro": {
58
+ "early_stopping": true,
59
+ "max_length": 300,
60
+ "num_beams": 4,
61
+ "prefix": "translate English to Romanian: "
62
+ }
63
+ },
64
+ "torch_dtype": "float32",
65
+ "transformers_version": "4.26.0",
66
+ "use_cache": true,
67
+ "vocab_size": 32600
68
+ }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "decoder_start_token_id": 0,
5
+ "eos_token_id": 2,
6
+ "pad_token_id": 0,
7
+ "transformers_version": "4.26.0"
8
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5c2a0f5b7a039aee1818cf2870d60954d52ac1bc277ffe3b1c90d5a8526b31
3
+ size 243038297
special_tokens_map.json ADDED
@@ -0,0 +1,753 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<extra_id_99>",
5
+ "lstrip": true,
6
+ "normalized": true,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "<extra_id_98>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ {
18
+ "content": "<extra_id_97>",
19
+ "lstrip": true,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ {
25
+ "content": "<extra_id_96>",
26
+ "lstrip": true,
27
+ "normalized": true,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ },
31
+ {
32
+ "content": "<extra_id_95>",
33
+ "lstrip": true,
34
+ "normalized": true,
35
+ "rstrip": false,
36
+ "single_word": false
37
+ },
38
+ {
39
+ "content": "<extra_id_94>",
40
+ "lstrip": true,
41
+ "normalized": true,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ },
45
+ {
46
+ "content": "<extra_id_93>",
47
+ "lstrip": true,
48
+ "normalized": true,
49
+ "rstrip": false,
50
+ "single_word": false
51
+ },
52
+ {
53
+ "content": "<extra_id_92>",
54
+ "lstrip": true,
55
+ "normalized": true,
56
+ "rstrip": false,
57
+ "single_word": false
58
+ },
59
+ {
60
+ "content": "<extra_id_91>",
61
+ "lstrip": true,
62
+ "normalized": true,
63
+ "rstrip": false,
64
+ "single_word": false
65
+ },
66
+ {
67
+ "content": "<extra_id_90>",
68
+ "lstrip": true,
69
+ "normalized": true,
70
+ "rstrip": false,
71
+ "single_word": false
72
+ },
73
+ {
74
+ "content": "<extra_id_89>",
75
+ "lstrip": true,
76
+ "normalized": true,
77
+ "rstrip": false,
78
+ "single_word": false
79
+ },
80
+ {
81
+ "content": "<extra_id_88>",
82
+ "lstrip": true,
83
+ "normalized": true,
84
+ "rstrip": false,
85
+ "single_word": false
86
+ },
87
+ {
88
+ "content": "<extra_id_87>",
89
+ "lstrip": true,
90
+ "normalized": true,
91
+ "rstrip": false,
92
+ "single_word": false
93
+ },
94
+ {
95
+ "content": "<extra_id_86>",
96
+ "lstrip": true,
97
+ "normalized": true,
98
+ "rstrip": false,
99
+ "single_word": false
100
+ },
101
+ {
102
+ "content": "<extra_id_85>",
103
+ "lstrip": true,
104
+ "normalized": true,
105
+ "rstrip": false,
106
+ "single_word": false
107
+ },
108
+ {
109
+ "content": "<extra_id_84>",
110
+ "lstrip": true,
111
+ "normalized": true,
112
+ "rstrip": false,
113
+ "single_word": false
114
+ },
115
+ {
116
+ "content": "<extra_id_83>",
117
+ "lstrip": true,
118
+ "normalized": true,
119
+ "rstrip": false,
120
+ "single_word": false
121
+ },
122
+ {
123
+ "content": "<extra_id_82>",
124
+ "lstrip": true,
125
+ "normalized": true,
126
+ "rstrip": false,
127
+ "single_word": false
128
+ },
129
+ {
130
+ "content": "<extra_id_81>",
131
+ "lstrip": true,
132
+ "normalized": true,
133
+ "rstrip": false,
134
+ "single_word": false
135
+ },
136
+ {
137
+ "content": "<extra_id_80>",
138
+ "lstrip": true,
139
+ "normalized": true,
140
+ "rstrip": false,
141
+ "single_word": false
142
+ },
143
+ {
144
+ "content": "<extra_id_79>",
145
+ "lstrip": true,
146
+ "normalized": true,
147
+ "rstrip": false,
148
+ "single_word": false
149
+ },
150
+ {
151
+ "content": "<extra_id_78>",
152
+ "lstrip": true,
153
+ "normalized": true,
154
+ "rstrip": false,
155
+ "single_word": false
156
+ },
157
+ {
158
+ "content": "<extra_id_77>",
159
+ "lstrip": true,
160
+ "normalized": true,
161
+ "rstrip": false,
162
+ "single_word": false
163
+ },
164
+ {
165
+ "content": "<extra_id_76>",
166
+ "lstrip": true,
167
+ "normalized": true,
168
+ "rstrip": false,
169
+ "single_word": false
170
+ },
171
+ {
172
+ "content": "<extra_id_75>",
173
+ "lstrip": true,
174
+ "normalized": true,
175
+ "rstrip": false,
176
+ "single_word": false
177
+ },
178
+ {
179
+ "content": "<extra_id_74>",
180
+ "lstrip": true,
181
+ "normalized": true,
182
+ "rstrip": false,
183
+ "single_word": false
184
+ },
185
+ {
186
+ "content": "<extra_id_73>",
187
+ "lstrip": true,
188
+ "normalized": true,
189
+ "rstrip": false,
190
+ "single_word": false
191
+ },
192
+ {
193
+ "content": "<extra_id_72>",
194
+ "lstrip": true,
195
+ "normalized": true,
196
+ "rstrip": false,
197
+ "single_word": false
198
+ },
199
+ {
200
+ "content": "<extra_id_71>",
201
+ "lstrip": true,
202
+ "normalized": true,
203
+ "rstrip": false,
204
+ "single_word": false
205
+ },
206
+ {
207
+ "content": "<extra_id_70>",
208
+ "lstrip": true,
209
+ "normalized": true,
210
+ "rstrip": false,
211
+ "single_word": false
212
+ },
213
+ {
214
+ "content": "<extra_id_69>",
215
+ "lstrip": true,
216
+ "normalized": true,
217
+ "rstrip": false,
218
+ "single_word": false
219
+ },
220
+ {
221
+ "content": "<extra_id_68>",
222
+ "lstrip": true,
223
+ "normalized": true,
224
+ "rstrip": false,
225
+ "single_word": false
226
+ },
227
+ {
228
+ "content": "<extra_id_67>",
229
+ "lstrip": true,
230
+ "normalized": true,
231
+ "rstrip": false,
232
+ "single_word": false
233
+ },
234
+ {
235
+ "content": "<extra_id_66>",
236
+ "lstrip": true,
237
+ "normalized": true,
238
+ "rstrip": false,
239
+ "single_word": false
240
+ },
241
+ {
242
+ "content": "<extra_id_65>",
243
+ "lstrip": true,
244
+ "normalized": true,
245
+ "rstrip": false,
246
+ "single_word": false
247
+ },
248
+ {
249
+ "content": "<extra_id_64>",
250
+ "lstrip": true,
251
+ "normalized": true,
252
+ "rstrip": false,
253
+ "single_word": false
254
+ },
255
+ {
256
+ "content": "<extra_id_63>",
257
+ "lstrip": true,
258
+ "normalized": true,
259
+ "rstrip": false,
260
+ "single_word": false
261
+ },
262
+ {
263
+ "content": "<extra_id_62>",
264
+ "lstrip": true,
265
+ "normalized": true,
266
+ "rstrip": false,
267
+ "single_word": false
268
+ },
269
+ {
270
+ "content": "<extra_id_61>",
271
+ "lstrip": true,
272
+ "normalized": true,
273
+ "rstrip": false,
274
+ "single_word": false
275
+ },
276
+ {
277
+ "content": "<extra_id_60>",
278
+ "lstrip": true,
279
+ "normalized": true,
280
+ "rstrip": false,
281
+ "single_word": false
282
+ },
283
+ {
284
+ "content": "<extra_id_59>",
285
+ "lstrip": true,
286
+ "normalized": true,
287
+ "rstrip": false,
288
+ "single_word": false
289
+ },
290
+ {
291
+ "content": "<extra_id_58>",
292
+ "lstrip": true,
293
+ "normalized": true,
294
+ "rstrip": false,
295
+ "single_word": false
296
+ },
297
+ {
298
+ "content": "<extra_id_57>",
299
+ "lstrip": true,
300
+ "normalized": true,
301
+ "rstrip": false,
302
+ "single_word": false
303
+ },
304
+ {
305
+ "content": "<extra_id_56>",
306
+ "lstrip": true,
307
+ "normalized": true,
308
+ "rstrip": false,
309
+ "single_word": false
310
+ },
311
+ {
312
+ "content": "<extra_id_55>",
313
+ "lstrip": true,
314
+ "normalized": true,
315
+ "rstrip": false,
316
+ "single_word": false
317
+ },
318
+ {
319
+ "content": "<extra_id_54>",
320
+ "lstrip": true,
321
+ "normalized": true,
322
+ "rstrip": false,
323
+ "single_word": false
324
+ },
325
+ {
326
+ "content": "<extra_id_53>",
327
+ "lstrip": true,
328
+ "normalized": true,
329
+ "rstrip": false,
330
+ "single_word": false
331
+ },
332
+ {
333
+ "content": "<extra_id_52>",
334
+ "lstrip": true,
335
+ "normalized": true,
336
+ "rstrip": false,
337
+ "single_word": false
338
+ },
339
+ {
340
+ "content": "<extra_id_51>",
341
+ "lstrip": true,
342
+ "normalized": true,
343
+ "rstrip": false,
344
+ "single_word": false
345
+ },
346
+ {
347
+ "content": "<extra_id_50>",
348
+ "lstrip": true,
349
+ "normalized": true,
350
+ "rstrip": false,
351
+ "single_word": false
352
+ },
353
+ {
354
+ "content": "<extra_id_49>",
355
+ "lstrip": true,
356
+ "normalized": true,
357
+ "rstrip": false,
358
+ "single_word": false
359
+ },
360
+ {
361
+ "content": "<extra_id_48>",
362
+ "lstrip": true,
363
+ "normalized": true,
364
+ "rstrip": false,
365
+ "single_word": false
366
+ },
367
+ {
368
+ "content": "<extra_id_47>",
369
+ "lstrip": true,
370
+ "normalized": true,
371
+ "rstrip": false,
372
+ "single_word": false
373
+ },
374
+ {
375
+ "content": "<extra_id_46>",
376
+ "lstrip": true,
377
+ "normalized": true,
378
+ "rstrip": false,
379
+ "single_word": false
380
+ },
381
+ {
382
+ "content": "<extra_id_45>",
383
+ "lstrip": true,
384
+ "normalized": true,
385
+ "rstrip": false,
386
+ "single_word": false
387
+ },
388
+ {
389
+ "content": "<extra_id_44>",
390
+ "lstrip": true,
391
+ "normalized": true,
392
+ "rstrip": false,
393
+ "single_word": false
394
+ },
395
+ {
396
+ "content": "<extra_id_43>",
397
+ "lstrip": true,
398
+ "normalized": true,
399
+ "rstrip": false,
400
+ "single_word": false
401
+ },
402
+ {
403
+ "content": "<extra_id_42>",
404
+ "lstrip": true,
405
+ "normalized": true,
406
+ "rstrip": false,
407
+ "single_word": false
408
+ },
409
+ {
410
+ "content": "<extra_id_41>",
411
+ "lstrip": true,
412
+ "normalized": true,
413
+ "rstrip": false,
414
+ "single_word": false
415
+ },
416
+ {
417
+ "content": "<extra_id_40>",
418
+ "lstrip": true,
419
+ "normalized": true,
420
+ "rstrip": false,
421
+ "single_word": false
422
+ },
423
+ {
424
+ "content": "<extra_id_39>",
425
+ "lstrip": true,
426
+ "normalized": true,
427
+ "rstrip": false,
428
+ "single_word": false
429
+ },
430
+ {
431
+ "content": "<extra_id_38>",
432
+ "lstrip": true,
433
+ "normalized": true,
434
+ "rstrip": false,
435
+ "single_word": false
436
+ },
437
+ {
438
+ "content": "<extra_id_37>",
439
+ "lstrip": true,
440
+ "normalized": true,
441
+ "rstrip": false,
442
+ "single_word": false
443
+ },
444
+ {
445
+ "content": "<extra_id_36>",
446
+ "lstrip": true,
447
+ "normalized": true,
448
+ "rstrip": false,
449
+ "single_word": false
450
+ },
451
+ {
452
+ "content": "<extra_id_35>",
453
+ "lstrip": true,
454
+ "normalized": true,
455
+ "rstrip": false,
456
+ "single_word": false
457
+ },
458
+ {
459
+ "content": "<extra_id_34>",
460
+ "lstrip": true,
461
+ "normalized": true,
462
+ "rstrip": false,
463
+ "single_word": false
464
+ },
465
+ {
466
+ "content": "<extra_id_33>",
467
+ "lstrip": true,
468
+ "normalized": true,
469
+ "rstrip": false,
470
+ "single_word": false
471
+ },
472
+ {
473
+ "content": "<extra_id_32>",
474
+ "lstrip": true,
475
+ "normalized": true,
476
+ "rstrip": false,
477
+ "single_word": false
478
+ },
479
+ {
480
+ "content": "<extra_id_31>",
481
+ "lstrip": true,
482
+ "normalized": true,
483
+ "rstrip": false,
484
+ "single_word": false
485
+ },
486
+ {
487
+ "content": "<extra_id_30>",
488
+ "lstrip": true,
489
+ "normalized": true,
490
+ "rstrip": false,
491
+ "single_word": false
492
+ },
493
+ {
494
+ "content": "<extra_id_29>",
495
+ "lstrip": true,
496
+ "normalized": true,
497
+ "rstrip": false,
498
+ "single_word": false
499
+ },
500
+ {
501
+ "content": "<extra_id_28>",
502
+ "lstrip": true,
503
+ "normalized": true,
504
+ "rstrip": false,
505
+ "single_word": false
506
+ },
507
+ {
508
+ "content": "<extra_id_27>",
509
+ "lstrip": true,
510
+ "normalized": true,
511
+ "rstrip": false,
512
+ "single_word": false
513
+ },
514
+ {
515
+ "content": "<extra_id_26>",
516
+ "lstrip": true,
517
+ "normalized": true,
518
+ "rstrip": false,
519
+ "single_word": false
520
+ },
521
+ {
522
+ "content": "<extra_id_25>",
523
+ "lstrip": true,
524
+ "normalized": true,
525
+ "rstrip": false,
526
+ "single_word": false
527
+ },
528
+ {
529
+ "content": "<extra_id_24>",
530
+ "lstrip": true,
531
+ "normalized": true,
532
+ "rstrip": false,
533
+ "single_word": false
534
+ },
535
+ {
536
+ "content": "<extra_id_23>",
537
+ "lstrip": true,
538
+ "normalized": true,
539
+ "rstrip": false,
540
+ "single_word": false
541
+ },
542
+ {
543
+ "content": "<extra_id_22>",
544
+ "lstrip": true,
545
+ "normalized": true,
546
+ "rstrip": false,
547
+ "single_word": false
548
+ },
549
+ {
550
+ "content": "<extra_id_21>",
551
+ "lstrip": true,
552
+ "normalized": true,
553
+ "rstrip": false,
554
+ "single_word": false
555
+ },
556
+ {
557
+ "content": "<extra_id_20>",
558
+ "lstrip": true,
559
+ "normalized": true,
560
+ "rstrip": false,
561
+ "single_word": false
562
+ },
563
+ {
564
+ "content": "<extra_id_19>",
565
+ "lstrip": true,
566
+ "normalized": true,
567
+ "rstrip": false,
568
+ "single_word": false
569
+ },
570
+ {
571
+ "content": "<extra_id_18>",
572
+ "lstrip": true,
573
+ "normalized": true,
574
+ "rstrip": false,
575
+ "single_word": false
576
+ },
577
+ {
578
+ "content": "<extra_id_17>",
579
+ "lstrip": true,
580
+ "normalized": true,
581
+ "rstrip": false,
582
+ "single_word": false
583
+ },
584
+ {
585
+ "content": "<extra_id_16>",
586
+ "lstrip": true,
587
+ "normalized": true,
588
+ "rstrip": false,
589
+ "single_word": false
590
+ },
591
+ {
592
+ "content": "<extra_id_15>",
593
+ "lstrip": true,
594
+ "normalized": true,
595
+ "rstrip": false,
596
+ "single_word": false
597
+ },
598
+ {
599
+ "content": "<extra_id_14>",
600
+ "lstrip": true,
601
+ "normalized": true,
602
+ "rstrip": false,
603
+ "single_word": false
604
+ },
605
+ {
606
+ "content": "<extra_id_13>",
607
+ "lstrip": true,
608
+ "normalized": true,
609
+ "rstrip": false,
610
+ "single_word": false
611
+ },
612
+ {
613
+ "content": "<extra_id_12>",
614
+ "lstrip": true,
615
+ "normalized": true,
616
+ "rstrip": false,
617
+ "single_word": false
618
+ },
619
+ {
620
+ "content": "<extra_id_11>",
621
+ "lstrip": true,
622
+ "normalized": true,
623
+ "rstrip": false,
624
+ "single_word": false
625
+ },
626
+ {
627
+ "content": "<extra_id_10>",
628
+ "lstrip": true,
629
+ "normalized": true,
630
+ "rstrip": false,
631
+ "single_word": false
632
+ },
633
+ {
634
+ "content": "<extra_id_9>",
635
+ "lstrip": true,
636
+ "normalized": true,
637
+ "rstrip": false,
638
+ "single_word": false
639
+ },
640
+ {
641
+ "content": "<extra_id_8>",
642
+ "lstrip": true,
643
+ "normalized": true,
644
+ "rstrip": false,
645
+ "single_word": false
646
+ },
647
+ {
648
+ "content": "<extra_id_7>",
649
+ "lstrip": true,
650
+ "normalized": true,
651
+ "rstrip": false,
652
+ "single_word": false
653
+ },
654
+ {
655
+ "content": "<extra_id_6>",
656
+ "lstrip": true,
657
+ "normalized": true,
658
+ "rstrip": false,
659
+ "single_word": false
660
+ },
661
+ {
662
+ "content": "<extra_id_5>",
663
+ "lstrip": true,
664
+ "normalized": true,
665
+ "rstrip": false,
666
+ "single_word": false
667
+ },
668
+ {
669
+ "content": "<extra_id_4>",
670
+ "lstrip": true,
671
+ "normalized": true,
672
+ "rstrip": false,
673
+ "single_word": false
674
+ },
675
+ {
676
+ "content": "<extra_id_3>",
677
+ "lstrip": true,
678
+ "normalized": true,
679
+ "rstrip": false,
680
+ "single_word": false
681
+ },
682
+ {
683
+ "content": "<extra_id_2>",
684
+ "lstrip": true,
685
+ "normalized": true,
686
+ "rstrip": false,
687
+ "single_word": false
688
+ },
689
+ {
690
+ "content": "<extra_id_1>",
691
+ "lstrip": true,
692
+ "normalized": true,
693
+ "rstrip": false,
694
+ "single_word": false
695
+ },
696
+ {
697
+ "content": "<extra_id_0>",
698
+ "lstrip": true,
699
+ "normalized": true,
700
+ "rstrip": false,
701
+ "single_word": false
702
+ }
703
+ ],
704
+ "bos_token": {
705
+ "content": "<s>",
706
+ "lstrip": false,
707
+ "normalized": true,
708
+ "rstrip": false,
709
+ "single_word": false
710
+ },
711
+ "cls_token": {
712
+ "content": "<s>",
713
+ "lstrip": false,
714
+ "normalized": true,
715
+ "rstrip": false,
716
+ "single_word": false
717
+ },
718
+ "eos_token": {
719
+ "content": "</s>",
720
+ "lstrip": false,
721
+ "normalized": true,
722
+ "rstrip": false,
723
+ "single_word": false
724
+ },
725
+ "mask_token": {
726
+ "content": "<mask>",
727
+ "lstrip": true,
728
+ "normalized": true,
729
+ "rstrip": false,
730
+ "single_word": false
731
+ },
732
+ "pad_token": {
733
+ "content": "<pad>",
734
+ "lstrip": false,
735
+ "normalized": true,
736
+ "rstrip": false,
737
+ "single_word": false
738
+ },
739
+ "sep_token": {
740
+ "content": "</s>",
741
+ "lstrip": false,
742
+ "normalized": true,
743
+ "rstrip": false,
744
+ "single_word": false
745
+ },
746
+ "unk_token": {
747
+ "content": "<unk>",
748
+ "lstrip": false,
749
+ "normalized": true,
750
+ "rstrip": false,
751
+ "single_word": false
752
+ }
753
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "cls_token": {
12
+ "__type": "AddedToken",
13
+ "content": "<s>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "eos_token": {
20
+ "__type": "AddedToken",
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false
26
+ },
27
+ "errors": "replace",
28
+ "mask_token": {
29
+ "__type": "AddedToken",
30
+ "content": "<mask>",
31
+ "lstrip": true,
32
+ "normalized": true,
33
+ "rstrip": false,
34
+ "single_word": false
35
+ },
36
+ "model_max_length": 512,
37
+ "name_or_path": "Salesforce/codet5-small",
38
+ "pad_token": {
39
+ "__type": "AddedToken",
40
+ "content": "<pad>",
41
+ "lstrip": false,
42
+ "normalized": true,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ "sep_token": {
47
+ "__type": "AddedToken",
48
+ "content": "</s>",
49
+ "lstrip": false,
50
+ "normalized": true,
51
+ "rstrip": false,
52
+ "single_word": false
53
+ },
54
+ "special_tokens_map_file": "/root/.cache/huggingface/hub/models--Salesforce--codet5-small/snapshots/a642dc934e5475185369d09ac07091dfe72a31fc/special_tokens_map.json",
55
+ "tokenizer_class": "RobertaTokenizer",
56
+ "trim_offsets": true,
57
+ "unk_token": {
58
+ "__type": "AddedToken",
59
+ "content": "<unk>",
60
+ "lstrip": false,
61
+ "normalized": true,
62
+ "rstrip": false,
63
+ "single_word": false
64
+ }
65
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff