alvations commited on
Commit
2d0b34a
1 Parent(s): ba7ee39

Training in progress, step 5

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,1054 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "abundant": 250922,
3
+ "achachi": 250100,
4
+ "achachila": 250101,
5
+ "achachilan tatapa": 250102,
6
+ "achacu": 250103,
7
+ "achaku": 250104,
8
+ "achupalla": 250105,
9
+ "achuqallu": 250106,
10
+ "aeroplane": 250866,
11
+ "afflict": 250976,
12
+ "afflicted": 251054,
13
+ "afternoon": 250943,
14
+ "ahuayo": 250107,
15
+ "ahuicha": 250108,
16
+ "ahuichan mamapa": 250109,
17
+ "ajanu": 250110,
18
+ "ajarankhu": 250111,
19
+ "ajhanu": 250112,
20
+ "ajusa": 250113,
21
+ "akhan tuyuña walikiti": 250114,
22
+ "alajgpacha": 250115,
23
+ "alajha": 250116,
24
+ "alajhpacha": 250117,
25
+ "alga": 250985,
26
+ "aliqa": 250118,
27
+ "aljheri": 250119,
28
+ "allchhi": 250120,
29
+ "allpachu": 250121,
30
+ "allpi": 250122,
31
+ "allqa": 250123,
32
+ "allqamari": 250124,
33
+ "allu": 250125,
34
+ "almost": 251013,
35
+ "alpaca": 250852,
36
+ "although": 250932,
37
+ "amaya": 250126,
38
+ "ampar moqo": 250127,
39
+ "ampar quta": 250128,
40
+ "ampara": 250129,
41
+ "amulet": 251007,
42
+ "amuyu": 250130,
43
+ "amwulansya thaqanim": 250131,
44
+ "anaqa": 250132,
45
+ "anata": 250133,
46
+ "anqa": 250134,
47
+ "apachi": 250135,
48
+ "apnaqeri": 250136,
49
+ "apples": 251000,
50
+ "armadillo": 250969,
51
+ "armpit": 250899,
52
+ "aru apiri": 250137,
53
+ "aruma": 250138,
54
+ "arumanti": 250139,
55
+ "arumi": 250140,
56
+ "arumita": 250141,
57
+ "asiru": 250142,
58
+ "aski": 250143,
59
+ "askiru churata tatay": 250144,
60
+ "aspirin": 250864,
61
+ "aspirina": 250145,
62
+ "ass": 250894,
63
+ "asu": 250146,
64
+ "asukara": 250147,
65
+ "aucch'i": 250148,
66
+ "auqui": 250149,
67
+ "autipacha": 250150,
68
+ "awti": 250151,
69
+ "awtu": 250152,
70
+ "awyuna": 250153,
71
+ "aycha kanka": 250154,
72
+ "aychathejhe": 250155,
73
+ "aymara": 250156,
74
+ "aynacha": 250157,
75
+ "añuthaya": 250158,
76
+ "barley": 251087,
77
+ "beefsteak": 250867,
78
+ "belly": 251028,
79
+ "biscuits": 251004,
80
+ "bitter": 250941,
81
+ "black and white": 250854,
82
+ "blacken": 251066,
83
+ "blurry": 250898,
84
+ "braid": 250957,
85
+ "breathing": 251081,
86
+ "broom": 251036,
87
+ "brother": 250945,
88
+ "brother-in-law": 250986,
89
+ "bunch": 251139,
90
+ "butcher": 251002,
91
+ "buttock": 250883,
92
+ "callachi": 250159,
93
+ "callchi": 250160,
94
+ "canary": 250878,
95
+ "caratacu": 250161,
96
+ "carrot": 251082,
97
+ "catari": 250162,
98
+ "catjata": 250163,
99
+ "cattle": 251132,
100
+ "catuña": 250164,
101
+ "cauquitaastasa?": 250165,
102
+ "cayu": 250166,
103
+ "cayumoqo": 250167,
104
+ "ch'aca": 250168,
105
+ "ch'aka": 250169,
106
+ "ch'aku": 250170,
107
+ "ch'alla": 250171,
108
+ "ch'amaka": 250172,
109
+ "ch'apaqa": 250173,
110
+ "ch'api": 250174,
111
+ "ch'araña": 250175,
112
+ "ch'armiri": 250176,
113
+ "ch'arqi": 250177,
114
+ "ch'axwa": 250178,
115
+ "ch'ayña": 250179,
116
+ "ch'añari": 250180,
117
+ "ch'ejhe": 250181,
118
+ "ch'epa ampara": 250182,
119
+ "ch'eqa ampara": 250183,
120
+ "ch'ihu": 250184,
121
+ "ch'iji": 250185,
122
+ "ch'ijma": 250186,
123
+ "ch'iki": 250187,
124
+ "ch'ina": 250188,
125
+ "ch'ipoqo": 250189,
126
+ "ch'ipuqu": 250190,
127
+ "ch'iqa": 250191,
128
+ "ch'islli": 250192,
129
+ "ch'iyar sajuna": 250193,
130
+ "ch'iyara": 250194,
131
+ "ch'ojhña": 250195,
132
+ "ch'oqe": 250196,
133
+ "ch'uju": 250197,
134
+ "ch'ulla": 250198,
135
+ "ch'umphi": 250199,
136
+ "ch'umpi": 250200,
137
+ "ch'uqi": 250201,
138
+ "ch'urahui": 250202,
139
+ "ch'uru": 250203,
140
+ "ch'usa": 250204,
141
+ "ch'uspi": 250205,
142
+ "ch'utu": 250206,
143
+ "ch'uxña": 250207,
144
+ "chaca": 250208,
145
+ "chacha": 250209,
146
+ "chacha yaq'aña": 250210,
147
+ "challa": 250211,
148
+ "challhua": 250212,
149
+ "challwa": 250213,
150
+ "chaullacaturi": 250214,
151
+ "chawlla": 250215,
152
+ "chayanta": 250216,
153
+ "chchiara": 250217,
154
+ "cheek": 250968,
155
+ "cheers!": 251123,
156
+ "cheese": 250978,
157
+ "chest": 251151,
158
+ "chhaqachhaqa": 250218,
159
+ "chharpu": 250219,
160
+ "chhaxlla": 250220,
161
+ "chheqanqara": 250221,
162
+ "chhichhillanca": 250222,
163
+ "chhichhillanka": 250223,
164
+ "chhijchi": 250224,
165
+ "chhipchi": 250225,
166
+ "chhiqanqara": 250226,
167
+ "chhojhchiphorqe": 250227,
168
+ "chhullchu": 250228,
169
+ "chhullunkhaya": 250229,
170
+ "chhuxchi": 250230,
171
+ "chhuxlla": 250231,
172
+ "chhuxu": 250232,
173
+ "chica": 250233,
174
+ "chica uru": 250234,
175
+ "chicäruma": 250235,
176
+ "chinqi": 250236,
177
+ "chips": 251020,
178
+ "chiqa": 250237,
179
+ "chira": 250238,
180
+ "chiuchi": 250239,
181
+ "chiwchi": 250240,
182
+ "chiñi": 250241,
183
+ "chopsticks": 250998,
184
+ "chore": 250995,
185
+ "chuhua": 250242,
186
+ "chuima": 250243,
187
+ "chujhaña": 250244,
188
+ "chullpa": 250245,
189
+ "chullunkiya": 250246,
190
+ "chupa": 250247,
191
+ "chupika": 250248,
192
+ "chuqa": 250249,
193
+ "chuqi": 250250,
194
+ "chuqupa": 250251,
195
+ "chuxu": 250252,
196
+ "chuyma": 250253,
197
+ "chuymani": 250254,
198
+ "cloudy": 250890,
199
+ "condor": 250911,
200
+ "convulsion": 250966,
201
+ "corpse": 250856,
202
+ "cough": 251131,
203
+ "coward": 250901,
204
+ "credit card": 250910,
205
+ "credit tarjita": 250255,
206
+ "cub": 251056,
207
+ "cucumber": 251037,
208
+ "cullaca": 250256,
209
+ "cunca": 250257,
210
+ "cunturi": 250258,
211
+ "cup and saucer": 251039,
212
+ "cupi ampara": 250259,
213
+ "curmi": 250260,
214
+ "curse": 251063,
215
+ "cusicusi": 250261,
216
+ "cyclone": 251120,
217
+ "dancer": 251097,
218
+ "dandruff": 251050,
219
+ "dark blue": 250886,
220
+ "darkness": 250873,
221
+ "daughter-in-law": 251148,
222
+ "daugther": 251034,
223
+ "deer": 251092,
224
+ "desert": 250916,
225
+ "diligent": 251047,
226
+ "dirt": 250885,
227
+ "disarranged": 250902,
228
+ "distant": 250942,
229
+ "donkey": 250895,
230
+ "dough": 251038,
231
+ "dozen": 251112,
232
+ "dried beef": 250876,
233
+ "drunken": 251122,
234
+ "dungeon": 250853,
235
+ "ear": 250947,
236
+ "eight": 251071,
237
+ "eighteen": 251115,
238
+ "eighty": 251072,
239
+ "elbow": 251005,
240
+ "elegant": 250958,
241
+ "eternal": 251142,
242
+ "excrement": 250930,
243
+ "excuse me": 251001,
244
+ "eyebrow": 250884,
245
+ "eyelash": 250900,
246
+ "farmer": 251147,
247
+ "father-in-law": 250865,
248
+ "fertilizing": 250949,
249
+ "fetus": 251090,
250
+ "fib": 251033,
251
+ "fifth": 251031,
252
+ "fifty": 251030,
253
+ "fingernail": 251085,
254
+ "firefly": 251011,
255
+ "fisherman": 250897,
256
+ "flamingo": 251024,
257
+ "flatulence": 251086,
258
+ "flea": 250960,
259
+ "flour": 250929,
260
+ "forefront": 251022,
261
+ "forehead": 251023,
262
+ "fork": 251103,
263
+ "forty": 251045,
264
+ "four hundred": 251043,
265
+ "fourteen": 251114,
266
+ "fourth": 251044,
267
+ "full moon": 251125,
268
+ "garlic": 250848,
269
+ "gents' toilet": 250896,
270
+ "get an ambulance!": 250859,
271
+ "glowworm": 251012,
272
+ "glue": 251121,
273
+ "godfather": 250921,
274
+ "godmother": 250920,
275
+ "good afternoon": 251141,
276
+ "good evening": 251144,
277
+ "good morning": 250863,
278
+ "good-bye": 251083,
279
+ "grandfather": 250841,
280
+ "grandmother": 250845,
281
+ "grandson": 250851,
282
+ "grapefruit": 251119,
283
+ "grapes": 251129,
284
+ "great grandfather": 250842,
285
+ "great grandmother": 250846,
286
+ "grippe": 250956,
287
+ "guanaco": 251134,
288
+ "guinea pig": 251135,
289
+ "hamacura": 250262,
290
+ "hanchi": 250263,
291
+ "handful": 251048,
292
+ "hankko": 250264,
293
+ "have you got a pen?": 251040,
294
+ "help!": 251146,
295
+ "herd": 250860,
296
+ "hiwisa": 250265,
297
+ "hollow": 251017,
298
+ "honeybee": 251041,
299
+ "how much is this?": 251059,
300
+ "huahuita": 250266,
301
+ "huallpa": 250267,
302
+ "huampara": 250268,
303
+ "huank'u": 250269,
304
+ "huarahuara": 250270,
305
+ "huaranqa": 250271,
306
+ "huaranqanhuaranqapa": 250272,
307
+ "huarmi": 250273,
308
+ "huasara": 250274,
309
+ "huasuru": 250275,
310
+ "huat'a": 250276,
311
+ "huayna": 250277,
312
+ "huayronqo": 250278,
313
+ "hucumari": 250279,
314
+ "huila": 250280,
315
+ "huit'u": 250281,
316
+ "hunttuña": 250282,
317
+ "hupa llamayu": 250283,
318
+ "i don't eat meat": 250933,
319
+ "i don't know": 250937,
320
+ "i don't smoke": 250936,
321
+ "i don't understand": 250934,
322
+ "i feel ill": 251127,
323
+ "i need a doctor": 251107,
324
+ "i'd like a window seat, please": 251143,
325
+ "ichumama": 250284,
326
+ "ichutata": 250285,
327
+ "identical": 250977,
328
+ "idleness": 251075,
329
+ "ijma": 250286,
330
+ "ikiña": 250287,
331
+ "illapu": 250288,
332
+ "illness": 251126,
333
+ "illpa": 250289,
334
+ "imilla": 250290,
335
+ "in front": 250967,
336
+ "inkilla": 250291,
337
+ "insect": 251019,
338
+ "insipid": 250874,
339
+ "intelligent": 250882,
340
+ "intestine": 250948,
341
+ "intijalanta": 250292,
342
+ "intijalsu": 250293,
343
+ "iquilla": 250294,
344
+ "iquiña": 250295,
345
+ "is it safe to swim here?": 250849,
346
+ "isk'aqota": 250296,
347
+ "ispa": 250297,
348
+ "ispillo": 250298,
349
+ "itapallu": 250299,
350
+ "jach'a luk'ana": 250300,
351
+ "jach'a uta": 250301,
352
+ "jach'a wasu": 250302,
353
+ "jach'aqollo": 250303,
354
+ "jach'aqota": 250304,
355
+ "jacha": 250305,
356
+ "jahuari": 250306,
357
+ "jahuira": 250307,
358
+ "jak'u": 250308,
359
+ "jallu": 250309,
360
+ "jamach'i": 250310,
361
+ "jamp'atu": 250311,
362
+ "jamwurjisa": 250312,
363
+ "janchi": 250313,
364
+ "janis": 250314,
365
+ "janiw aych manq'rïktti": 250315,
366
+ "janiw intintktti": 250316,
367
+ "janiw pitañ luwarakiti": 250317,
368
+ "janiw pitirïktti": 250318,
369
+ "janiw yatktti": 250319,
370
+ "janiwa": 250320,
371
+ "janq'o": 250321,
372
+ "janq'u": 250322,
373
+ "janq'ulla": 250323,
374
+ "jant'aku": 250324,
375
+ "jaqi": 250325,
376
+ "jararankha": 250326,
377
+ "jararankhu": 250327,
378
+ "jaru": 250328,
379
+ "jatha": 250329,
380
+ "jathi": 250330,
381
+ "jawasa": 250331,
382
+ "jaxu": 250332,
383
+ "jay": 250333,
384
+ "jayp'u": 250334,
385
+ "jayra": 250335,
386
+ "jayri": 250336,
387
+ "jayu": 250337,
388
+ "jichhüru": 250338,
389
+ "jikhani": 250339,
390
+ "jilata": 250340,
391
+ "jilatata": 250341,
392
+ "jincho": 250342,
393
+ "jinchu": 250343,
394
+ "jinq'i": 250344,
395
+ "jiphilla": 250345,
396
+ "jiru": 250346,
397
+ "jisa": 250347,
398
+ "jiski": 250348,
399
+ "jiwaka": 250349,
400
+ "jiwaki": 250350,
401
+ "jiwata": 250351,
402
+ "jiwq'i": 250352,
403
+ "juch'usa": 250353,
404
+ "jucha": 250354,
405
+ "jucu": 250355,
406
+ "jucumari": 250356,
407
+ "jump'i": 250357,
408
+ "junt'u": 250358,
409
+ "junt'upacha": 250359,
410
+ "jupa": 250360,
411
+ "jupuqu": 250361,
412
+ "juq'ullu": 250362,
413
+ "jurma": 250363,
414
+ "juykhu": 250364,
415
+ "juyphipacha": 250365,
416
+ "juyra": 250366,
417
+ "k'achatak arst'am": 250367,
418
+ "k'achi": 250368,
419
+ "k'aira": 250369,
420
+ "k'aja": 250370,
421
+ "k'ana": 250371,
422
+ "k'anchilla": 250372,
423
+ "k'ank'a": 250373,
424
+ "k'ari": 250374,
425
+ "k'auna": 250375,
426
+ "k'awna": 250376,
427
+ "k'axilu": 250377,
428
+ "k'ayra": 250378,
429
+ "k'ita": 250379,
430
+ "k'iwcha": 250380,
431
+ "k'uchi": 250381,
432
+ "k'ulli": 250382,
433
+ "k'ullu": 250383,
434
+ "k'uma": 250384,
435
+ "k'umara": 250385,
436
+ "k'umu": 250386,
437
+ "k'usillo": 250387,
438
+ "k'uti": 250388,
439
+ "kallachi": 250389,
440
+ "kamisaraki": 250390,
441
+ "kanqiri": 250391,
442
+ "kaphiya": 250392,
443
+ "kawallu": 250393,
444
+ "kawkhans taksi utji": 250394,
445
+ "kawkharus awt istasyunirista": 250395,
446
+ "kawki": 250396,
447
+ "kawkins awt alkili": 250397,
448
+ "kawkits pasaj alirista": 250398,
449
+ "khallu": 250399,
450
+ "khankha": 250400,
451
+ "kharkhati": 250401,
452
+ "kharu": 250402,
453
+ "khaycatana": 250403,
454
+ "khañu": 250404,
455
+ "khirkhi": 250405,
456
+ "khuchi": 250406,
457
+ "khuchi li'ki": 250407,
458
+ "khuchuña": 250408,
459
+ "khullu": 250409,
460
+ "khuna": 250410,
461
+ "khunu": 250411,
462
+ "khunuqollonaca": 250412,
463
+ "khusa": 250413,
464
+ "kichu": 250414,
465
+ "kikipa": 250415,
466
+ "kimsa": 250416,
467
+ "kiru": 250417,
468
+ "kisu": 250418,
469
+ "kkunkkuri": 250419,
470
+ "knife": 250973,
471
+ "knives": 250974,
472
+ "kucha": 250420,
473
+ "kuchara": 250421,
474
+ "kuchillu": 250422,
475
+ "kukakula": 250423,
476
+ "kuliktiwu": 250424,
477
+ "kullaka": 250425,
478
+ "kumri": 250426,
479
+ "kuna uraxisa": 250427,
480
+ "kunata": 250428,
481
+ "kunjata": 250429,
482
+ "kunka": 250430,
483
+ "kuns umañ munta": 250431,
484
+ "kuntura": 250432,
485
+ "kupi": 250433,
486
+ "kusikusi": 250434,
487
+ "laca": 250435,
488
+ "lacach'aca": 250436,
489
+ "ladies' toilet": 251137,
490
+ "lagoon": 250925,
491
+ "lajhra": 250437,
492
+ "laka chaca": 250438,
493
+ "lakhampu": 250439,
494
+ "lamana": 250440,
495
+ "lamb": 250914,
496
+ "landmark": 251084,
497
+ "lankhu": 250441,
498
+ "lap'a": 250442,
499
+ "laphi": 250443,
500
+ "laq'a": 250444,
501
+ "laq'u": 250445,
502
+ "laqa": 250446,
503
+ "laqatu": 250447,
504
+ "laqha": 250448,
505
+ "laqu": 250449,
506
+ "larama": 250450,
507
+ "laranja": 250451,
508
+ "larankha": 250452,
509
+ "latanu": 250453,
510
+ "laxra": 250454,
511
+ "laxwi": 250455,
512
+ "layqa": 250456,
513
+ "left hand": 250880,
514
+ "lichi": 250457,
515
+ "light blue": 251062,
516
+ "lightning": 250991,
517
+ "liju": 250458,
518
+ "lik'i": 250459,
519
+ "limp": 250909,
520
+ "limuna": 250460,
521
+ "lip'ichi": 250461,
522
+ "liqi liqi": 250462,
523
+ "lirpu": 250463,
524
+ "lizard": 250939,
525
+ "llaki": 250464,
526
+ "llallawa": 250465,
527
+ "llama": 251061,
528
+ "llaphi": 250466,
529
+ "llatunctunca": 250467,
530
+ "llawi": 250468,
531
+ "lliju lliju": 250469,
532
+ "llijulliju": 250470,
533
+ "llilli": 250471,
534
+ "llink'i": 250472,
535
+ "llumpaqa": 250473,
536
+ "llätunca": 250474,
537
+ "lodging": 251080,
538
+ "louse": 250984,
539
+ "luk'ana": 250475,
540
+ "lukkana": 250476,
541
+ "lunthata": 250477,
542
+ "luraña": 250478,
543
+ "luxru": 250479,
544
+ "magician": 250987,
545
+ "magnificent": 250988,
546
+ "maize": 251118,
547
+ "makaña": 250480,
548
+ "malitanakasti": 250481,
549
+ "mallku": 250482,
550
+ "mallq'a": 250483,
551
+ "mamani": 250484,
552
+ "manku": 250485,
553
+ "manq'a jayt'uña": 250486,
554
+ "manq'añ sirk'i": 250487,
555
+ "manqha": 250488,
556
+ "mansana": 250489,
557
+ "mantikilla": 250490,
558
+ "mascot": 250906,
559
+ "mat'aqi": 250491,
560
+ "may i use your phone?": 251100,
561
+ "mayay jiskt'asïma": 250492,
562
+ "mañaso": 250493,
563
+ "mijilla": 250494,
564
+ "mik'i": 250495,
565
+ "mikha": 250496,
566
+ "millu": 250497,
567
+ "mirq'i": 250498,
568
+ "misk'i": 250499,
569
+ "misk'i t'ant'alla": 250500,
570
+ "mosquito": 250893,
571
+ "mother-in-law": 251094,
572
+ "mountain range": 250975,
573
+ "moustache": 251091,
574
+ "mucus": 250953,
575
+ "mug": 250928,
576
+ "mujlli": 250501,
577
+ "muk'i": 250502,
578
+ "mullu": 250503,
579
+ "muraru": 250504,
580
+ "muruqu": 250505,
581
+ "mushroom": 251046,
582
+ "mushrooms": 250999,
583
+ "mute": 250858,
584
+ "muxsa": 250506,
585
+ "muxsa chhuxllu": 250507,
586
+ "muyta": 250508,
587
+ "naira": 250509,
588
+ "nalra": 250510,
589
+ "nappy": 250913,
590
+ "nayra": 250511,
591
+ "near": 251014,
592
+ "nearly": 251015,
593
+ "neat": 250993,
594
+ "neighbor": 251128,
595
+ "nerve": 250861,
596
+ "nettle": 250927,
597
+ "new moon": 250944,
598
+ "ninalaq'o": 250512,
599
+ "ninanqu": 250513,
600
+ "nineteen": 251110,
601
+ "ninety": 250990,
602
+ "non-smoking please": 250935,
603
+ "noon": 250903,
604
+ "nose": 251010,
605
+ "one hundred": 251026,
606
+ "one thousand": 250915,
607
+ "oraqe": 250514,
608
+ "orphan": 251133,
609
+ "outside": 250862,
610
+ "outstanding": 250961,
611
+ "p'eke": 250515,
612
+ "p'iqi": 250516,
613
+ "p'isaqa": 250517,
614
+ "p'iya": 250518,
615
+ "p'ujru chuwa": 250519,
616
+ "paca": 250520,
617
+ "pachpa": 250521,
618
+ "palatu": 250522,
619
+ "palaya": 250523,
620
+ "palaya kawkhankisa": 250524,
621
+ "pampa": 250525,
622
+ "pancake": 251096,
623
+ "pankataya": 250526,
624
+ "panqara": 250527,
625
+ "papa phirita": 250528,
626
+ "papataca": 250529,
627
+ "paqallqo": 250530,
628
+ "paqallqtunca": 250531,
629
+ "paqallqu": 250532,
630
+ "pariwana": 250533,
631
+ "parrot": 251124,
632
+ "partridge": 251016,
633
+ "pasapurt lunthatapxitu": 250534,
634
+ "pasapurti": 250535,
635
+ "pataca": 250536,
636
+ "patacmara": 250537,
637
+ "pataka": 250538,
638
+ "patunca": 250539,
639
+ "paya": 250540,
640
+ "peanut": 250908,
641
+ "peninsula": 250919,
642
+ "perqa": 250541,
643
+ "phajhsi": 250542,
644
+ "phalahuiru": 250543,
645
+ "phantta": 250544,
646
+ "pharmasya kawkhankisa": 250545,
647
+ "phatanka": 250546,
648
+ "phaxcha": 250547,
649
+ "phaxi": 250548,
650
+ "phesqa": 250549,
651
+ "phesqatunca": 250550,
652
+ "phesqëri": 250551,
653
+ "phichitanqa": 250552,
654
+ "phisi": 250553,
655
+ "phisna": 250554,
656
+ "phisqa": 250555,
657
+ "phucha": 250556,
658
+ "phucu": 250557,
659
+ "phuju": 250558,
660
+ "phurutilla": 250559,
661
+ "phuyu": 250560,
662
+ "pichana": 250561,
663
+ "pichaña": 250562,
664
+ "pichu": 250563,
665
+ "pigeon": 251074,
666
+ "pillow": 250881,
667
+ "pilpinto": 250564,
668
+ "pilpintu": 250565,
669
+ "pineapple": 250843,
670
+ "pipinu": 250566,
671
+ "pirasa": 250567,
672
+ "pirtunitayya": 250568,
673
+ "pisi": 250569,
674
+ "pitu": 250570,
675
+ "platillu": 250571,
676
+ "please speak more slowly": 250955,
677
+ "plentiful": 250923,
678
+ "poqota": 250572,
679
+ "pork": 250970,
680
+ "porker": 250971,
681
+ "potato": 250887,
682
+ "potatoes": 250889,
683
+ "ppekke": 250573,
684
+ "provisions": 250954,
685
+ "puncu": 250574,
686
+ "puntawul lanktati": 250575,
687
+ "pupa": 250576,
688
+ "puquta": 250577,
689
+ "puraca": 250578,
690
+ "puraka": 250579,
691
+ "pusi": 250580,
692
+ "pusipataca": 250581,
693
+ "pusiri": 250582,
694
+ "pusitunca": 250583,
695
+ "päpataca": 250584,
696
+ "pätunca": 250585,
697
+ "q'allampa": 250586,
698
+ "q'anu": 250587,
699
+ "q'apa": 250588,
700
+ "q'api": 250589,
701
+ "q'ara": 250590,
702
+ "q'asa": 250591,
703
+ "q'atawi": 250592,
704
+ "q'ayma": 250593,
705
+ "q'añu": 250594,
706
+ "q'ejhoq'ejho": 250595,
707
+ "q'ellu": 250596,
708
+ "q'ili": 250597,
709
+ "q'illu": 250598,
710
+ "q'ita": 250599,
711
+ "q'iwi": 250600,
712
+ "q'uruta": 250601,
713
+ "q'uya": 250602,
714
+ "qachu": 250603,
715
+ "qallu": 250604,
716
+ "qallu luk'ana": 250605,
717
+ "qamaqe": 250606,
718
+ "qamaqi": 250607,
719
+ "qampu": 250608,
720
+ "qanjili": 250609,
721
+ "qanjlli": 250610,
722
+ "qapa": 250611,
723
+ "qaqa": 250612,
724
+ "qaqawara": 250613,
725
+ "qarqa": 250614,
726
+ "qasiwi": 250615,
727
+ "qasïwi": 250616,
728
+ "qawqhas akaxa": 250617,
729
+ "qawqhaxisa": 250618,
730
+ "qawra": 250619,
731
+ "qaxsi": 250620,
732
+ "qellqeri": 250621,
733
+ "qenaya": 250622,
734
+ "qhala": 250623,
735
+ "qhana": 250624,
736
+ "qhana sajuna": 250625,
737
+ "qhatu": 250626,
738
+ "qhepa": 250627,
739
+ "qheri": 250628,
740
+ "qhespi": 250629,
741
+ "qhilla": 250630,
742
+ "qhincha": 250631,
743
+ "qhini": 250632,
744
+ "qhiphürkama": 250633,
745
+ "qhisti": 250634,
746
+ "qhontiri": 250635,
747
+ "qhuna": 250636,
748
+ "qilla": 250637,
749
+ "qimara": 250638,
750
+ "qinaya": 250639,
751
+ "qisimi": 250640,
752
+ "qismi": 250641,
753
+ "qolli": 250642,
754
+ "qollqe": 250643,
755
+ "qonqori": 250644,
756
+ "qont'asina": 250645,
757
+ "qont'asiña": 250646,
758
+ "qoqa": 250647,
759
+ "qoqaqoqa": 250648,
760
+ "qora": 250649,
761
+ "qota": 250650,
762
+ "quimsa": 250651,
763
+ "quimsapataca": 250652,
764
+ "quimsaqallqo": 250653,
765
+ "quimsaqallqtunca": 250654,
766
+ "quimsatunca": 250655,
767
+ "quimsiri": 250656,
768
+ "quimsïri": 250657,
769
+ "quitula": 250658,
770
+ "qulayu": 250659,
771
+ "qulla": 250660,
772
+ "qullana": 250661,
773
+ "qullpa": 250662,
774
+ "qullqi": 250663,
775
+ "qullu": 250664,
776
+ "quna": 250665,
777
+ "qunchu": 250666,
778
+ "qunquri": 250667,
779
+ "qupa": 250668,
780
+ "quqa": 250669,
781
+ "ququ": 250670,
782
+ "quri": 250671,
783
+ "qurpa": 250672,
784
+ "quta": 250673,
785
+ "quña": 250674,
786
+ "quñchu": 250675,
787
+ "raspberries": 251008,
788
+ "remedy": 251076,
789
+ "right hand": 250912,
790
+ "rusara": 250676,
791
+ "sacred": 251077,
792
+ "sajuna": 250677,
793
+ "salesman": 250850,
794
+ "saliva": 251098,
795
+ "saltpeter": 251078,
796
+ "samana": 250678,
797
+ "sanawrya": 250679,
798
+ "sand": 250872,
799
+ "sapha": 250680,
800
+ "saru": 250681,
801
+ "sarxäya": 250682,
802
+ "sausage": 250868,
803
+ "saxra": 250683,
804
+ "saywa": 250684,
805
+ "scare": 251006,
806
+ "scorpion": 250847,
807
+ "scurf": 251051,
808
+ "seashell": 250891,
809
+ "see you tomorrow": 251065,
810
+ "seed": 250905,
811
+ "serpent": 250870,
812
+ "seventeen": 251111,
813
+ "sheep": 251130,
814
+ "shower": 251106,
815
+ "sillq'i": 250685,
816
+ "sillu": 250686,
817
+ "siqusa": 250687,
818
+ "sira": 250688,
819
+ "sirwisa": 250689,
820
+ "sirwuyla": 250690,
821
+ "siwara": 250691,
822
+ "siwi": 250692,
823
+ "siwulla": 250693,
824
+ "sixteen": 251117,
825
+ "sixth": 251089,
826
+ "sixty": 251088,
827
+ "skunk": 250869,
828
+ "slack": 251067,
829
+ "smooth": 251079,
830
+ "snail": 250892,
831
+ "sojhta": 250694,
832
+ "sojhtatunca": 250695,
833
+ "sojhtïri": 250696,
834
+ "solitary": 250888,
835
+ "someone stole my passport": 251025,
836
+ "son-in-law": 251105,
837
+ "soot": 251068,
838
+ "sorrowful": 251055,
839
+ "soup": 250996,
840
+ "sour": 250940,
841
+ "sparrow": 251032,
842
+ "sparrow hawk": 250855,
843
+ "squirrel": 251145,
844
+ "stomach": 251042,
845
+ "strawberries": 251035,
846
+ "stupid": 250924,
847
+ "sullcatata": 250697,
848
+ "sullu": 250698,
849
+ "suma": 250699,
850
+ "sunkha": 250700,
851
+ "suti": 250701,
852
+ "suxta": 250702,
853
+ "swallow": 250879,
854
+ "sweat": 250951,
855
+ "sweet corn": 251009,
856
+ "sweet potato": 251064,
857
+ "swimmer": 250983,
858
+ "swine": 250972,
859
+ "t'ant'a": 250703,
860
+ "t'anta": 250704,
861
+ "t'awra": 250705,
862
+ "t'inkha": 250706,
863
+ "t'ixni": 250707,
864
+ "t'ojho": 250708,
865
+ "t'una": 250709,
866
+ "tadpole": 250952,
867
+ "taksi": 250710,
868
+ "taqi": 250711,
869
+ "tarantula": 251058,
870
+ "taruka": 250712,
871
+ "tarwi": 250713,
872
+ "tasteless": 251049,
873
+ "tatter": 251095,
874
+ "tawaqu": 250714,
875
+ "taxa": 250715,
876
+ "tayca": 250716,
877
+ "taycch'i": 250717,
878
+ "tayka": 250718,
879
+ "tea": 251104,
880
+ "teeth": 250982,
881
+ "ten thousand": 251109,
882
+ "tepid": 250989,
883
+ "testicle": 251053,
884
+ "thaki": 250719,
885
+ "thank you": 251149,
886
+ "thank you very much": 251150,
887
+ "thantaha": 250720,
888
+ "thantha": 250721,
889
+ "thaxti": 250722,
890
+ "thaya": 250723,
891
+ "the bill, please": 251060,
892
+ "thievish": 250994,
893
+ "thirteen": 251116,
894
+ "thirty": 251073,
895
+ "thoqori": 250724,
896
+ "thorny": 250875,
897
+ "three hundred": 251070,
898
+ "thujsa": 250725,
899
+ "thuri": 250726,
900
+ "thusa": 250727,
901
+ "thutha": 250728,
902
+ "tiliphun numirusti": 250729,
903
+ "tiliphunu": 250730,
904
+ "tiliphunuy mayt'ita": 250731,
905
+ "tinta kawkhankisa": 250732,
906
+ "tirin istasyuna kawkinkisa": 250733,
907
+ "tirina": 250734,
908
+ "tirinchi": 250735,
909
+ "tiwu": 250736,
910
+ "tixi": 250737,
911
+ "tiyi": 250738,
912
+ "to disturb": 250877,
913
+ "toad": 250931,
914
+ "toe": 251057,
915
+ "tollqa": 250739,
916
+ "tomatoes": 251108,
917
+ "tongue": 250981,
918
+ "tonqo": 250740,
919
+ "tucha": 250741,
920
+ "tuktur nisisitta": 250742,
921
+ "tullpa": 250743,
922
+ "tullqa": 250744,
923
+ "tumati": 250745,
924
+ "tunca": 250746,
925
+ "tuncahuaranqa": 250747,
926
+ "tuncallätuncani": 250748,
927
+ "tuncamayani": 250749,
928
+ "tuncapaqallquni": 250750,
929
+ "tuncapayajalja": 250751,
930
+ "tuncapayani": 250752,
931
+ "tuncaphesqani": 250753,
932
+ "tuncapusini": 250754,
933
+ "tuncaqimsaqallquni": 250755,
934
+ "tuncaquimsani": 250756,
935
+ "tuncasojhtani": 250757,
936
+ "tunka": 250758,
937
+ "tunqu": 250759,
938
+ "tunu": 250760,
939
+ "turunja": 250761,
940
+ "tustat t'ant'a": 250762,
941
+ "tutuca": 250763,
942
+ "twelve": 251113,
943
+ "twin": 250926,
944
+ "twisted": 251052,
945
+ "two hundred": 251021,
946
+ "tï": 250764,
947
+ "uichinca": 250765,
948
+ "umata": 250766,
949
+ "umaña": 250767,
950
+ "umt'añani": 250768,
951
+ "uncle": 250946,
952
+ "untamed": 250959,
953
+ "uqi": 250769,
954
+ "uritu": 250770,
955
+ "urpu": 250771,
956
+ "urqu": 250772,
957
+ "urt'a": 250773,
958
+ "uspitala": 250774,
959
+ "usutjamätwa": 250775,
960
+ "usuyiri": 250776,
961
+ "utajak'a": 250777,
962
+ "utajanana": 250778,
963
+ "utajanaña": 250779,
964
+ "uturunqu": 250780,
965
+ "uturuqu": 250781,
966
+ "uwasa": 250782,
967
+ "uwija": 250783,
968
+ "uyhua": 250784,
969
+ "uywa": 250785,
970
+ "vagina": 250904,
971
+ "vinegar": 251140,
972
+ "waiter": 250918,
973
+ "wajcha": 250786,
974
+ "wajlli": 250787,
975
+ "wallpa": 250788,
976
+ "wallq'i": 250789,
977
+ "wanaku": 250790,
978
+ "wank'u": 250791,
979
+ "wanku kawkinkisa": 250792,
980
+ "warawara": 250793,
981
+ "warku": 250794,
982
+ "warmi": 250795,
983
+ "warmi yaq'aña": 250796,
984
+ "waruru": 250797,
985
+ "wasara": 250798,
986
+ "wasita": 250799,
987
+ "waterfall": 251029,
988
+ "waxra": 250800,
989
+ "wayk'a": 250801,
990
+ "wayu": 250802,
991
+ "waña": 250803,
992
+ "weasel": 250844,
993
+ "what is the telephone number?": 251099,
994
+ "what time is it?": 250979,
995
+ "what would you like to drink?": 250980,
996
+ "where are the suitcases?": 250997,
997
+ "where are you from?": 250871,
998
+ "where can i buy a ticket?": 250965,
999
+ "where can i get a taxi?": 250962,
1000
+ "where can i hire a car?": 250964,
1001
+ "where can i park the car?": 250963,
1002
+ "where is the bank?": 251136,
1003
+ "where is the beach?": 251018,
1004
+ "where is the chemist?": 251027,
1005
+ "where is the shop?": 251101,
1006
+ "where is the train station?": 251102,
1007
+ "whitish": 250938,
1008
+ "wich'inka": 250804,
1009
+ "widow": 250907,
1010
+ "wila": 250805,
1011
+ "wila-chipica": 250806,
1012
+ "wild olive": 251069,
1013
+ "wilderness": 251138,
1014
+ "willulli": 250807,
1015
+ "winagri": 250808,
1016
+ "winas taris": 250809,
1017
+ "winas täris": 250810,
1018
+ "winaya": 250811,
1019
+ "wintantuqiruw qunt'añ munta": 250812,
1020
+ "winu": 250813,
1021
+ "winus nuchis": 250814,
1022
+ "winus tartis": 250815,
1023
+ "winus tiyas": 250816,
1024
+ "wiryu wasu": 250817,
1025
+ "wisiklita": 250818,
1026
+ "wisk'achu": 250819,
1027
+ "wiñaya": 250820,
1028
+ "worn out": 251003,
1029
+ "wound": 250992,
1030
+ "wrist": 250857,
1031
+ "yanapt'ita!": 250821,
1032
+ "yanqha": 250822,
1033
+ "yant'a": 250823,
1034
+ "yapu": 250824,
1035
+ "yapuchiri": 250825,
1036
+ "yatichiri": 250826,
1037
+ "yawri": 250827,
1038
+ "yes": 250950,
1039
+ "yesterday": 250917,
1040
+ "yojhch'a": 250828,
1041
+ "yoqa": 250829,
1042
+ "yoqalla": 250830,
1043
+ "young woman": 251093,
1044
+ "yunca": 250831,
1045
+ "yuqa": 250832,
1046
+ "yuqalla": 250833,
1047
+ "yuspagara": 250834,
1048
+ "yuspajarkätam": 250835,
1049
+ "yuspara": 250836,
1050
+ "yuxch'a": 250837,
1051
+ "ñicuta": 250838,
1052
+ "ñik'uta": 250839,
1053
+ "ñuñu": 250840
1054
+ }
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "alvations/mt5-aym-lex",
3
+ "architectures": [
4
+ "MT5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 2048,
7
+ "d_kv": 64,
8
+ "d_model": 768,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "gelu_new",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "gated-gelu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": true,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "mt5",
19
+ "num_decoder_layers": 12,
20
+ "num_heads": 12,
21
+ "num_layers": 12,
22
+ "output_past": true,
23
+ "pad_token_id": 0,
24
+ "relative_attention_max_distance": 128,
25
+ "relative_attention_num_buckets": 32,
26
+ "tie_word_embeddings": false,
27
+ "tokenizer_class": "T5Tokenizer",
28
+ "torch_dtype": "float32",
29
+ "transformers_version": "4.29.1",
30
+ "use_cache": true,
31
+ "vocab_size": 251152
32
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a608c585403de1b3b7608a0b9073217e66ce1da90c334bcb687131d655693ec8
3
+ size 2336092213
runs/May16_09-23-39_8f80d7c5c961/1684229048.7773266/events.out.tfevents.1684229048.8f80d7c5c961.1279.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbad7328412acfabe813095ddf577a7afe666480ef57cca5d925a444c6577425
3
+ size 6197
runs/May16_09-23-39_8f80d7c5c961/1684229053.1926608/events.out.tfevents.1684229053.8f80d7c5c961.1279.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fba5acb664ea3e7acd65e2f4700b9dad1c7b33b4c9cfd20b2067a81b74785917
3
+ size 6197
runs/May16_09-23-39_8f80d7c5c961/events.out.tfevents.1684229048.8f80d7c5c961.1279.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36856c1582c429d62cfe724f2702ec9dcd87ef07d22ae7384df81e0f19402d7e
3
+ size 8700
runs/May16_09-25-06_8f80d7c5c961/1684229119.5403051/events.out.tfevents.1684229119.8f80d7c5c961.1279.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:372a969107476b3f7d7239419706407a966793a82c4ae4cc3f05f7df73a0b75c
3
+ size 6197
runs/May16_09-25-06_8f80d7c5c961/1684229121.4736967/events.out.tfevents.1684229121.8f80d7c5c961.1279.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa52c76e67f9338f52693bf595540a954b63007913f3a64fe14942119731fabf
3
+ size 6197
runs/May16_09-25-06_8f80d7c5c961/events.out.tfevents.1684229119.8f80d7c5c961.1279.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:502b8beb15ff6fec1a78507b6af8ed24b83a8db3d5b591a2d3fe69bcf1236e43
3
+ size 8700
special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:812d584bfa2fbbd089f09abea7584511ff23db66c044460c061b10d00c3d3791
3
+ size 16592845
tokenizer_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "clean_up_tokenization_spaces": true,
4
+ "eos_token": "</s>",
5
+ "extra_ids": 0,
6
+ "model_max_length": 1000000000000000019884624838656,
7
+ "pad_token": "<pad>",
8
+ "sp_model_kwargs": {},
9
+ "tokenizer_class": "T5Tokenizer",
10
+ "unk_token": "<unk>"
11
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9401d24fa242cc6b49ad27b796a580622af9892e5d9566108d919bccfa4acaae
3
+ size 4027