Text Generation
Transformers
PyTorch
Nigerian Pidgin
gpt2
goldfish
text-generation-inference
Inference Endpoints
goldfish-models commited on
Commit
5e84783
1 Parent(s): ec33043

Upload pcm_latn_10mb tokenizer.

Browse files
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"[XXXXX46]": 48433, "[XXXXX180]": 48567, "[XXXXX103]": 48490, "[XXXXX737]": 49124, "[XXXXX400]": 48787, "[XXXXX758]": 49145, "[XXXXX112]": 48499, "[XXXXX342]": 48729, "[XXXXX7]": 48394, "[XXXXX205]": 48592, "[XXXXX137]": 48524, "[XXXXX83]": 48470, "[XXXXX591]": 48978, "[XXXXX220]": 48607, "[XXXXX384]": 48771, "[XXXXX287]": 48674, "[XXXXX473]": 48860, "[XXXXX105]": 48492, "[XXXXX757]": 49144, "[XXXXX142]": 48529, "[XXXXX286]": 48673, "[XXXXX738]": 49125, "[XXXXX629]": 49016, "[XXXXX474]": 48861, "[XXXXX534]": 48921, "[XXXXX704]": 49091, "[XXXXX60]": 48447, "[XXXXX669]": 49056, "[XXXXX575]": 48962, "[XXXXX747]": 49134, "[XXXXX589]": 48976, "[XXXXX54]": 48441, "[XXXXX170]": 48557, "[XXXXX376]": 48763, "[XXXXX157]": 48544, "[XXXXX309]": 48696, "[XXXXX581]": 48968, "[XXXXX563]": 48950, "[XXXXX326]": 48713, "[XXXXX58]": 48445, "[XXXXX229]": 48616, "[XXXXX22]": 48409, "[XXXXX5]": 48392, "[XXXXX607]": 48994, "[XXXXX362]": 48749, "[XXXXX688]": 49075, "[XXXXX656]": 49043, "[XXXXX616]": 49003, "[XXXXX494]": 48881, "[XXXXX88]": 48475, "[XXXXX106]": 48493, "[XXXXX617]": 49004, "[XXXXX716]": 49103, "[XXXXX238]": 48625, "[XXXXX710]": 49097, "[XXXXX154]": 48541, "[XXXXX639]": 49026, "[XXXXX687]": 49074, "[XXXXX325]": 48712, "[XXXXX297]": 48684, "[XXXXX13]": 48400, "[XXXXX413]": 48800, "[XXXXX625]": 49012, "[XXXXX735]": 49122, "[XXXXX453]": 48840, "[XXXXX305]": 48692, "[XXXXX115]": 48502, "[XXXXX8]": 48395, "[XXXXX695]": 49082, "[XXXXX67]": 48454, "[XXXXX139]": 48526, "[XXXXX506]": 48893, "[XXXXX210]": 48597, "[XXXXX201]": 48588, "[XXXXX193]": 48580, "[XXXXX647]": 49034, "[XXXXX549]": 48936, "[XXXXX675]": 49062, "[XXXXX339]": 48726, "[XXXXX703]": 49090, "[XXXXX652]": 49039, "[XXXXX451]": 48838, "[XXXXX512]": 48899, "[XXXXX498]": 48885, "[XXXXX269]": 48656, "[XXXXX519]": 48906, "[XXXXX134]": 48521, "[XXXXX331]": 48718, "[XXXXX526]": 48913, "[XXXXX454]": 48841, "[XXXXX417]": 48804, "[XXXXX66]": 48453, "[XXXXX537]": 48924, "[XXXXX270]": 48657, "[XXXXX332]": 48719, "[XXXXX158]": 48545, "[XXXXX224]": 48611, "[XXXXX538]": 48925, "[XXXXX721]": 49108, "[XXXXX40]": 48427, "[XXXXX728]": 49115, "[XXXXX605]": 48992, "[XXXXX588]": 48975, "[XXXXX174]": 48561, "[XXXXX422]": 48809, "[XXXXX565]": 48952, "[XXXXX208]": 48595, "[XXXXX366]": 48753, "[XXXXX176]": 48563, "[XXXXX222]": 48609, "[XXXXX321]": 48708, "[XXXXX750]": 49137, "[XXXXX78]": 48465, "[XXXXX612]": 48999, "[XXXXX411]": 48798, "[XXXXX436]": 48823, "[XXXXX294]": 48681, "[XXXXX709]": 49096, "[XXXXX430]": 48817, "[XXXXX386]": 48773, "[XXXXX228]": 48615, "[XXXXX140]": 48527, "[XXXXX677]": 49064, "[XXXXX615]": 49002, "[XXXXX90]": 48477, "[XXXXX557]": 48944, "[XXXXX508]": 48895, "[XXXXX744]": 49131, "[XXXXX488]": 48875, "[XXXXX544]": 48931, "[XXXXX143]": 48530, "[XXXXX64]": 48451, "[XXXXX587]": 48974, "[XXXXX741]": 49128, "[XXXXX62]": 48449, "[XXXXX271]": 48658, "[XXXXX396]": 48783, "[XXXXX111]": 48498, "[XXXXX510]": 48897, "[XXXXX39]": 48426, "[XXXXX314]": 48701, "[XXXXX253]": 48640, "[XXXXX594]": 48981, "[XXXXX138]": 48525, "[XXXXX379]": 48766, "[XXXXX367]": 48754, "[XXXXX648]": 49035, "[XXXXX476]": 48863, "[XXXXX289]": 48676, "[XXXXX467]": 48854, "[XXXXX348]": 48735, "[XXXXX749]": 49136, "[XXXXX437]": 48824, "[XXXXX196]": 48583, "[XXXXX613]": 49000, "[XXXXX668]": 49055, "[XXXXX2]": 48389, "[XXXXX650]": 49037, "[XXXXX660]": 49047, "[XXXXX70]": 48457, "[XXXXX215]": 48602, "[XXXXX401]": 48788, "[XXXXX11]": 48398, "[XXXXX730]": 49117, "[XXXXX618]": 49005, "[XXXXX126]": 48513, "[XXXXX517]": 48904, "[XXXXX427]": 48814, "[XXXXX718]": 49105, "[XXXXX99]": 48486, "[XXXXX659]": 49046, "[XXXXX173]": 48560, "[XXXXX304]": 48691, "[XXXXX470]": 48857, "[XXXXX195]": 48582, "[XXXXX416]": 48803, "[XXXXX94]": 48481, "[XXXXX582]": 48969, "[XXXXX190]": 48577, "[XXXXX110]": 48497, "[XXXXX748]": 49135, "[XXXXX267]": 48654, "[XXXXX278]": 48665, "[XXXXX569]": 48956, "[XXXXX223]": 48610, "[XXXXX318]": 48705, "[XXXXX722]": 49109, "[XXXXX76]": 48463, "[XXXXX221]": 48608, "[XXXXX636]": 49023, "[XXXXX93]": 48480, "[XXXXX247]": 48634, "[XXXXX447]": 48834, "[XXXXX144]": 48531, "[XXXXX251]": 48638, "[XXXXX713]": 49100, "[XXXXX129]": 48516, "[XXXXX382]": 48769, "[XXXXX200]": 48587, "[XXXXX406]": 48793, "[XXXXX152]": 48539, "[XXXXX620]": 49007, "[XXXXX683]": 49070, "[XXXXX172]": 48559, "[XXXXX567]": 48954, "[XXXXX141]": 48528, "[XXXXX280]": 48667, "[XXXXX600]": 48987, "[XXXXX124]": 48511, "[XXXXX274]": 48661, "[XXXXX378]": 48765, "[XXXXX10]": 48397, "[XXXXX338]": 48725, "[XXXXX501]": 48888, "[XXXXX391]": 48778, "[XXXXX303]": 48690, "[XXXXX151]": 48538, "[XXXXX107]": 48494, "[XXXXX609]": 48996, "[XXXXX121]": 48508, "[XXXXX662]": 49049, "[XXXXX497]": 48884, "[XXXXX727]": 49114, "[XXXXX520]": 48907, "[XXXXX389]": 48776, "[XXXXX118]": 48505, "[XXXXX25]": 48412, "[XXXXX84]": 48471, "[XXXXX12]": 48399, "[XXXXX651]": 49038, "[XXXXX415]": 48802, "[XXXXX209]": 48596, "[XXXXX539]": 48926, "[XXXXX48]": 48435, "[XXXXX203]": 48590, "[XXXXX691]": 49078, "[XXXXX495]": 48882, "[XXXXX638]": 49025, "[XXXXX403]": 48790, "[XXXXX521]": 48908, "[XXXXX596]": 48983, "[XXXXX296]": 48683, "[XXXXX295]": 48682, "[XXXXX235]": 48622, "[XXXXX311]": 48698, "[XXXXX164]": 48551, "[XXXXX98]": 48485, "[XXXXX150]": 48537, "[XXXXX168]": 48555, "[XXXXX469]": 48856, "[XXXXX500]": 48887, "[XXXXX493]": 48880, "[XXXXX529]": 48916, "[XXXXX455]": 48842, "[XXXXX429]": 48816, "[XXXXX347]": 48734, "[XXXXX643]": 49030, "[XXXXX679]": 49066, "[XXXXX358]": 48745, "[XXXXX313]": 48700, "[XXXXX700]": 49087, "[XXXXX123]": 48510, "[XXXXX194]": 48581, "[XXXXX136]": 48523, "[XXXXX6]": 48393, "[XXXXX89]": 48476, "[XXXXX35]": 48422, "[XXXXX407]": 48794, "[XXXXX482]": 48869, "[XXXXX690]": 49077, "[XXXXX80]": 48467, "[XXXXX351]": 48738, "[XXXXX178]": 48565, "[XXXXX397]": 48784, "[XXXXX69]": 48456, "[XXXXX291]": 48678, "[XXXXX460]": 48847, "[XXXXX603]": 48990, "[XXXXX551]": 48938, "[XXXXX393]": 48780, "[XXXXX542]": 48929, "[XXXXX559]": 48946, "[XXXXX644]": 49031, "[XXXXX354]": 48741, "[XXXXX597]": 48984, "[XXXXX281]": 48668, "[XXXXX443]": 48830, "[XXXXX340]": 48727, "[XXXXX211]": 48598, "[XXXXX323]": 48710, "[XXXXX85]": 48472, "[XXXXX604]": 48991, "[XXXXX226]": 48613, "[XXXXX266]": 48653, "[XXXXX92]": 48479, "[XXXXX465]": 48852, "[XXXXX673]": 49060, "[XXXXX731]": 49118, "[XXXXX442]": 48829, "[XXXXX475]": 48862, "[XXXXX739]": 49126, "[XXXXX341]": 48728, "[XXXXX452]": 48839, "[XXXXX242]": 48629, "[XXXXX463]": 48850, "[XXXXX410]": 48797, "[XXXXX574]": 48961, "[XXXXX240]": 48627, "[XXXXX50]": 48437, "[XXXXX759]": 49146, "[XXXXX763]": 49150, "[XXXXX125]": 48512, "[XXXXX355]": 48742, "[XXXXX26]": 48413, "[XXXXX206]": 48593, "[XXXXX41]": 48428, "[XXXXX259]": 48646, "[XXXXX45]": 48432, "[XXXXX398]": 48785, "[XXXXX148]": 48535, "[XXXXX564]": 48951, "[XXXXX186]": 48573, "[XXXXX72]": 48459, "[XXXXX230]": 48617, "[XXXXX486]": 48873, "[XXXXX576]": 48963, "[XXXXX231]": 48618, "[XXXXX204]": 48591, "[XXXXX81]": 48468, "[XXXXX191]": 48578, "[XXXXX165]": 48552, "[XXXXX369]": 48756, "[XXXXX237]": 48624, "[XXXXX265]": 48652, "[XXXXX458]": 48845, "[XXXXX183]": 48570, "[XXXXX485]": 48872, "[XXXXX122]": 48509, "[XXXXX492]": 48879, "[XXXXX504]": 48891, "[XXXXX577]": 48964, "[XXXXX74]": 48461, "[XXXXX435]": 48822, "[XXXXX446]": 48833, "[XXXXX425]": 48812, "[XXXXX634]": 49021, "[XXXXX711]": 49098, "[XXXXX353]": 48740, "[XXXXX285]": 48672, "[XXXXX197]": 48584, "[XXXXX44]": 48431, "[XXXXX583]": 48970, "[XXXXX163]": 48550, "[XXXXX632]": 49019, "[XXXXX113]": 48500, "[XXXXX91]": 48478, "[XXXXX131]": 48518, "[XXXXX525]": 48912, "[XXXXX117]": 48504, "[XXXXX635]": 49022, "[XXXXX192]": 48579, "[XXXXX79]": 48466, "[XXXXX248]": 48635, "[XXXXX319]": 48706, "[XXXXX754]": 49141, "[XXXXX145]": 48532, "[XXXXX59]": 48446, "[XXXXX421]": 48808, "[XXXXX753]": 49140, "[XXXXX43]": 48430, "[XXXXX171]": 48558, "[XXXXX333]": 48720, "[XXXXX705]": 49092, "[XXXXX640]": 49027, "[XXXXX734]": 49121, "[XXXXX419]": 48806, "[XXXXX3]": 48390, "[XXXXX77]": 48464, "[XXXXX558]": 48945, "[XXXXX207]": 48594, "[XXXXX619]": 49006, "[XXXXX424]": 48811, "[XXXXX4]": 48391, "[XXXXX466]": 48853, "[XXXXX73]": 48460, "[XXXXX350]": 48737, "[XXXXX47]": 48434, "[XXXXX34]": 48421, "[XXXXX349]": 48736, "[XXXXX57]": 48444, "[XXXXX159]": 48546, "[XXXXX462]": 48849, "[XXXXX32]": 48419, "[XXXXX24]": 48411, "[XXXXX185]": 48572, "[XXXXX481]": 48868, "[XXXXX682]": 49069, "[XXXXX239]": 48626, "[XXXXX623]": 49010, "[XXXXX592]": 48979, "[XXXXX30]": 48417, "[XXXXX584]": 48971, "[XXXXX586]": 48973, "[SEP]": 48384, "[XXXXX692]": 49079, "[XXXXX23]": 48410, "[XXXXX61]": 48448, "[XXXXX255]": 48642, "[XXXXX502]": 48889, "[XXXXX56]": 48443, "[XXXXX483]": 48870, "[XXXXX97]": 48484, "[XXXXX352]": 48739, "[XXXXX116]": 48503, "[XXXXX676]": 49063, "[XXXXX664]": 49051, "[XXXXX216]": 48603, "[XXXXX65]": 48452, "[XXXXX329]": 48716, "[XXXXX189]": 48576, "[XXXXX68]": 48455, "[XXXXX363]": 48750, "[XXXXX86]": 48473, "[XXXXX428]": 48815, "[XXXXX27]": 48414, "[XXXXX75]": 48462, "[XXXXX119]": 48506, "[XXXXX52]": 48439, "[XXXXX666]": 49053, "[XXXXX202]": 48589, "[XXXXX630]": 49017, "[XXXXX698]": 49085, "[XXXXX132]": 48519, "[XXXXX633]": 49020, "[XXXXX702]": 49089, "[XXXXX166]": 48553, "[XXXXX624]": 49011, "[XXXXX531]": 48918, "[XXXXX322]": 48709, "[XXXXX642]": 49029, "[XXXXX412]": 48799, "[XXXXX507]": 48894, "[XXXXX249]": 48636, "[XXXXX51]": 48438, "[XXXXX480]": 48867, "[XXXXX491]": 48878, "[XXXXX302]": 48689, "[XXXXX133]": 48520, "[XXXXX646]": 49033, "[XXXXX162]": 48549, "[XXXXX28]": 48415, "[XXXXX71]": 48458, "[XXXXX373]": 48760, "[XXXXX182]": 48569, "[XXXXX459]": 48846, "[XXXXX524]": 48911, "[XXXXX292]": 48679, "[XXXXX225]": 48612, "[XXXXX149]": 48536, "[XXXXX343]": 48730, "[XXXXX503]": 48890, "[XXXXX335]": 48722, "[XXXXX478]": 48865, "[XXXXX127]": 48514, "[XXXXX523]": 48910, "[XXXXX579]": 48966, "[XXXXX404]": 48791, "[XXXXX562]": 48949, "[XXXXX360]": 48747, "[XXXXX324]": 48711, "[XXXXX627]": 49014, "[XXXXX156]": 48543, "[XXXXX670]": 49057, "[XXXXX570]": 48957, "[XXXXX15]": 48402, "[XXXXX213]": 48600, "[XXXXX626]": 49013, "[XXXXX212]": 48599, "[XXXXX746]": 49133, "[XXXXX334]": 48721, "[XXXXX357]": 48744, "[XXXXX628]": 49015, "[XXXXX468]": 48855, "[XXXXX614]": 49001, "[XXXXX756]": 49143, "[XXXXX653]": 49040, "[XXXXX761]": 49148, "[XXXXX499]": 48886, "[XXXXX49]": 48436, "[XXXXX602]": 48989, "[XXXXX377]": 48764, "[XXXXX762]": 49149, "[XXXXX637]": 49024, "[XXXXX621]": 49008, "[XXXXX365]": 48752, "[XXXXX720]": 49107, "[XXXXX742]": 49129, "[XXXXX359]": 48746, "[XXXXX293]": 48680, "[XXXXX699]": 49086, "[XXXXX645]": 49032, "[XXXXX312]": 48699, "[XXXXX608]": 48995, "[XXXXX315]": 48702, "[XXXXX694]": 49081, "[XXXXX611]": 48998, "[XXXXX264]": 48651, "[XXXXX300]": 48687, "[XXXXX63]": 48450, "[XXXXX187]": 48574, "[XXXXX245]": 48632, "[XXXXX262]": 48649, "[XXXXX545]": 48932, "[XXXXX496]": 48883, "[XXXXX261]": 48648, "[XXXXX751]": 49138, "[XXXXX169]": 48556, "[XXXXX540]": 48927, "[XXXXX36]": 48423, "[XXXXX250]": 48637, "[XXXXX535]": 48922, "[XXXXX233]": 48620, "[XXXXX234]": 48621, "[XXXXX477]": 48864, "[XXXXX31]": 48418, "[XXXXX580]": 48967, "[XXXXX439]": 48826, "[XXXXX693]": 49080, "[XXXXX515]": 48902, "[XXXXX456]": 48843, "[XXXXX561]": 48948, "[XXXXX16]": 48403, "[XXXXX715]": 49102, "[XXXXX18]": 48405, "[XXXXX479]": 48866, "[XXXXX135]": 48522, "[XXXXX33]": 48420, "[XXXXX308]": 48695, "[XXXXX423]": 48810, "[XXXXX316]": 48703, "[XXXXX42]": 48429, "[XXXXX522]": 48909, "[XXXXX461]": 48848, "[XXXXX554]": 48941, "[XXXXX654]": 49041, "[XXXXX96]": 48483, "[XXXXX578]": 48965, "[XXXXX420]": 48807, "[XXXXX532]": 48919, "[XXXXX19]": 48406, "[XXXXX530]": 48917, "[XXXXX199]": 48586, "[XXXXX745]": 49132, "[XXXXX546]": 48933, "[XXXXX307]": 48694, "[XXXXX590]": 48977, "[XXXXX513]": 48900, "[XXXXX484]": 48871, "[XXXXX450]": 48837, "[XXXXX218]": 48605, "[XXXXX181]": 48568, "[XXXXX431]": 48818, "[XXXXX725]": 49112, "[XXXXX552]": 48939, "[XXXXX610]": 48997, "[CLS]": 48383, "[XXXXX678]": 49065, "[XXXXX277]": 48664, "[XXXXX566]": 48953, "[XXXXX560]": 48947, "[XXXXX198]": 48585, "[XXXXX275]": 48662, "[XXXXX593]": 48980, "[XXXXX598]": 48985, "[XXXXX38]": 48425, "[XXXXX663]": 49050, "[XXXXX665]": 49052, "[XXXXX268]": 48655, "[XXXXX409]": 48796, "[XXXXX448]": 48835, "[XXXXX706]": 49093, "[XXXXX288]": 48675, "[XXXXX487]": 48874, "[XXXXX29]": 48416, "[XXXXX433]": 48820, "[XXXXX606]": 48993, "[XXXXX696]": 49083, "[XXXXX717]": 49104, "[XXXXX740]": 49127, "[XXXXX179]": 48566, "[XXXXX37]": 48424, "[XXXXX681]": 49068, "[XXXXX161]": 48548, "[XXXXX120]": 48507, "[XXXXX128]": 48515, "[XXXXX541]": 48928, "[XXXXX631]": 49018, "[XXXXX101]": 48488, "[XXXXX21]": 48408, "[XXXXX217]": 48604, "[XXXXX260]": 48647, "[XXXXX505]": 48892, "[XXXXX543]": 48930, "[XXXXX374]": 48761, "[XXXXX464]": 48851, "[XXXXX708]": 49095, "[XXXXX490]": 48877, "[XXXXX155]": 48542, "[XXXXX130]": 48517, "[XXXXX399]": 48786, "[XXXXX723]": 49110, "[XXXXX764]": 49151, "[XXXXX528]": 48915, "[XXXXX724]": 49111, "[XXXXX380]": 48767, "[XXXXX232]": 48619, "[XXXXX346]": 48733, "[XXXXX516]": 48903, "[XXXXX108]": 48495, "[XXXXX368]": 48755, "[XXXXX104]": 48491, "[XXXXX55]": 48442, "[XXXXX153]": 48540, "[XXXXX219]": 48606, "[XXXXX686]": 49073, "[XXXXX658]": 49045, "[XXXXX511]": 48898, "[XXXXX298]": 48685, "[XXXXX445]": 48832, "[XXXXX395]": 48782, "[XXXXX276]": 48663, "[XXXXX599]": 48986, "[XXXXX674]": 49061, "[XXXXX685]": 49072, "[XXXXX1]": 48388, "[XXXXX370]": 48757, "[XXXXX760]": 49147, "[XXXXX257]": 48644, "[XXXXX719]": 49106, "[XXXXX555]": 48942, "[XXXXX299]": 48686, "[XXXXX175]": 48562, "[XXXXX440]": 48827, "[XXXXX736]": 49123, "[XXXXX328]": 48715, "[XXXXX752]": 49139, "[XXXXX375]": 48762, "[XXXXX82]": 48469, "[XXXXX514]": 48901, "[XXXXX290]": 48677, "[XXXXX20]": 48407, "[XXXXX95]": 48482, "[XXXXX320]": 48707, "[XXXXX527]": 48914, "[XXXXX444]": 48831, "[XXXXX256]": 48643, "[XXXXX0]": 48387, "[XXXXX184]": 48571, "[XXXXX680]": 49067, "[XXXXX714]": 49101, "[XXXXX273]": 48660, "[XXXXX177]": 48564, "[XXXXX449]": 48836, "[XXXXX258]": 48645, "[XXXXX390]": 48777, "[XXXXX553]": 48940, "[XXXXX14]": 48401, "[XXXXX383]": 48770, "[XXXXX729]": 49116, "[XXXXX556]": 48943, "[XXXXX649]": 49036, "[XXXXX87]": 48474, "[XXXXX356]": 48743, "[XXXXX402]": 48789, "[XXXXX336]": 48723, "[XXXXX536]": 48923, "[XXXXX572]": 48959, "[XXXXX306]": 48693, "[XXXXX167]": 48554, "[XXXXX263]": 48650, "[XXXXX364]": 48751, "[XXXXX252]": 48639, "[XXXXX726]": 49113, "[XXXXX568]": 48955, "[XXXXX345]": 48732, "[XXXXX414]": 48801, "[XXXXX214]": 48601, "[XXXXX684]": 49071, "[XXXXX622]": 49009, "[XXXXX246]": 48633, "[XXXXX102]": 48489, "<pad>": 48385, "[XXXXX387]": 48774, "[XXXXX394]": 48781, "[XXXXX236]": 48623, "[XXXXX146]": 48533, "[XXXXX109]": 48496, "[XXXXX160]": 48547, "[XXXXX743]": 49130, "[XXXXX712]": 49099, "[XXXXX254]": 48641, "[XXXXX548]": 48935, "[XXXXX755]": 49142, "[XXXXX279]": 48666, "[XXXXX282]": 48669, "[XXXXX114]": 48501, "[XXXXX361]": 48748, "[XXXXX53]": 48440, "[XXXXX472]": 48859, "[XXXXX550]": 48937, "[XXXXX17]": 48404, "[XXXXX707]": 49094, "[XXXXX601]": 48988, "[XXXXX671]": 49058, "[XXXXX408]": 48795, "[XXXXX310]": 48697, "[XXXXX381]": 48768, "[XXXXX432]": 48819, "[XXXXX732]": 49119, "[XXXXX188]": 48575, "[XXXXX372]": 48759, "[XXXXX641]": 49028, "[XXXXX441]": 48828, "[XXXXX272]": 48659, "[XXXXX100]": 48487, "[XXXXX243]": 48630, "[XXXXX405]": 48792, "[XXXXX284]": 48671, "[XXXXX518]": 48905, "[XXXXX371]": 48758, "[XXXXX426]": 48813, "[XXXXX689]": 49076, "[XXXXX147]": 48534, "[XXXXX301]": 48688, "[XXXXX585]": 48972, "[XXXXX533]": 48920, "[XXXXX392]": 48779, "[XXXXX701]": 49088, "[XXXXX672]": 49059, "[XXXXX595]": 48982, "[XXXXX573]": 48960, "[XXXXX283]": 48670, "[XXXXX241]": 48628, "[XXXXX655]": 49042, "[XXXXX337]": 48724, "[XXXXX697]": 49084, "[MASK]": 48386, "[XXXXX344]": 48731, "[XXXXX438]": 48825, "[XXXXX571]": 48958, "[XXXXX327]": 48714, "[XXXXX418]": 48805, "[XXXXX227]": 48614, "[XXXXX547]": 48934, "[XXXXX317]": 48704, "[XXXXX661]": 49048, "[XXXXX330]": 48717, "[XXXXX509]": 48896, "[XXXXX489]": 48876, "[XXXXX9]": 48396, "[XXXXX733]": 49120, "[XXXXX244]": 48631, "[XXXXX385]": 48772, "[XXXXX471]": 48858, "[XXXXX388]": 48775, "[XXXXX657]": 49044, "[XXXXX667]": 49054, "[XXXXX457]": 48844, "[XXXXX434]": 48821}
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}, "additional_special_tokens": ["[XXXXX0]", "[XXXXX1]", "[XXXXX2]", "[XXXXX3]", "[XXXXX4]", "[XXXXX5]", "[XXXXX6]", "[XXXXX7]", "[XXXXX8]", "[XXXXX9]", "[XXXXX10]", "[XXXXX11]", "[XXXXX12]", "[XXXXX13]", "[XXXXX14]", "[XXXXX15]", "[XXXXX16]", "[XXXXX17]", "[XXXXX18]", "[XXXXX19]", "[XXXXX20]", "[XXXXX21]", "[XXXXX22]", "[XXXXX23]", "[XXXXX24]", "[XXXXX25]", "[XXXXX26]", "[XXXXX27]", "[XXXXX28]", "[XXXXX29]", "[XXXXX30]", "[XXXXX31]", "[XXXXX32]", "[XXXXX33]", "[XXXXX34]", "[XXXXX35]", "[XXXXX36]", "[XXXXX37]", "[XXXXX38]", "[XXXXX39]", "[XXXXX40]", "[XXXXX41]", "[XXXXX42]", "[XXXXX43]", "[XXXXX44]", "[XXXXX45]", "[XXXXX46]", "[XXXXX47]", "[XXXXX48]", "[XXXXX49]", "[XXXXX50]", "[XXXXX51]", "[XXXXX52]", "[XXXXX53]", "[XXXXX54]", "[XXXXX55]", "[XXXXX56]", "[XXXXX57]", "[XXXXX58]", "[XXXXX59]", "[XXXXX60]", "[XXXXX61]", "[XXXXX62]", "[XXXXX63]", "[XXXXX64]", "[XXXXX65]", "[XXXXX66]", "[XXXXX67]", "[XXXXX68]", "[XXXXX69]", "[XXXXX70]", "[XXXXX71]", "[XXXXX72]", "[XXXXX73]", "[XXXXX74]", "[XXXXX75]", "[XXXXX76]", "[XXXXX77]", "[XXXXX78]", "[XXXXX79]", "[XXXXX80]", "[XXXXX81]", "[XXXXX82]", "[XXXXX83]", "[XXXXX84]", "[XXXXX85]", "[XXXXX86]", "[XXXXX87]", "[XXXXX88]", "[XXXXX89]", "[XXXXX90]", "[XXXXX91]", "[XXXXX92]", "[XXXXX93]", "[XXXXX94]", "[XXXXX95]", "[XXXXX96]", "[XXXXX97]", "[XXXXX98]", "[XXXXX99]", "[XXXXX100]", "[XXXXX101]", "[XXXXX102]", "[XXXXX103]", "[XXXXX104]", "[XXXXX105]", "[XXXXX106]", "[XXXXX107]", "[XXXXX108]", "[XXXXX109]", "[XXXXX110]", "[XXXXX111]", "[XXXXX112]", "[XXXXX113]", "[XXXXX114]", "[XXXXX115]", "[XXXXX116]", "[XXXXX117]", "[XXXXX118]", "[XXXXX119]", "[XXXXX120]", "[XXXXX121]", "[XXXXX122]", "[XXXXX123]", "[XXXXX124]", "[XXXXX125]", "[XXXXX126]", "[XXXXX127]", "[XXXXX128]", "[XXXXX129]", "[XXXXX130]", "[XXXXX131]", "[XXXXX132]", "[XXXXX133]", "[XXXXX134]", "[XXXXX135]", "[XXXXX136]", "[XXXXX137]", "[XXXXX138]", "[XXXXX139]", "[XXXXX140]", "[XXXXX141]", "[XXXXX142]", "[XXXXX143]", "[XXXXX144]", "[XXXXX145]", "[XXXXX146]", "[XXXXX147]", "[XXXXX148]", "[XXXXX149]", "[XXXXX150]", "[XXXXX151]", "[XXXXX152]", "[XXXXX153]", "[XXXXX154]", "[XXXXX155]", "[XXXXX156]", "[XXXXX157]", "[XXXXX158]", "[XXXXX159]", "[XXXXX160]", "[XXXXX161]", "[XXXXX162]", "[XXXXX163]", "[XXXXX164]", "[XXXXX165]", "[XXXXX166]", "[XXXXX167]", "[XXXXX168]", "[XXXXX169]", "[XXXXX170]", "[XXXXX171]", "[XXXXX172]", "[XXXXX173]", "[XXXXX174]", "[XXXXX175]", "[XXXXX176]", "[XXXXX177]", "[XXXXX178]", "[XXXXX179]", "[XXXXX180]", "[XXXXX181]", "[XXXXX182]", "[XXXXX183]", "[XXXXX184]", "[XXXXX185]", "[XXXXX186]", "[XXXXX187]", "[XXXXX188]", "[XXXXX189]", "[XXXXX190]", "[XXXXX191]", "[XXXXX192]", "[XXXXX193]", "[XXXXX194]", "[XXXXX195]", "[XXXXX196]", "[XXXXX197]", "[XXXXX198]", "[XXXXX199]", "[XXXXX200]", "[XXXXX201]", "[XXXXX202]", "[XXXXX203]", "[XXXXX204]", "[XXXXX205]", "[XXXXX206]", "[XXXXX207]", "[XXXXX208]", "[XXXXX209]", "[XXXXX210]", "[XXXXX211]", "[XXXXX212]", "[XXXXX213]", "[XXXXX214]", "[XXXXX215]", "[XXXXX216]", "[XXXXX217]", "[XXXXX218]", "[XXXXX219]", "[XXXXX220]", "[XXXXX221]", "[XXXXX222]", "[XXXXX223]", "[XXXXX224]", "[XXXXX225]", "[XXXXX226]", "[XXXXX227]", "[XXXXX228]", "[XXXXX229]", "[XXXXX230]", "[XXXXX231]", "[XXXXX232]", "[XXXXX233]", "[XXXXX234]", "[XXXXX235]", "[XXXXX236]", "[XXXXX237]", "[XXXXX238]", "[XXXXX239]", "[XXXXX240]", "[XXXXX241]", "[XXXXX242]", "[XXXXX243]", "[XXXXX244]", "[XXXXX245]", "[XXXXX246]", "[XXXXX247]", "[XXXXX248]", "[XXXXX249]", "[XXXXX250]", "[XXXXX251]", "[XXXXX252]", "[XXXXX253]", "[XXXXX254]", "[XXXXX255]", "[XXXXX256]", "[XXXXX257]", "[XXXXX258]", "[XXXXX259]", "[XXXXX260]", "[XXXXX261]", "[XXXXX262]", "[XXXXX263]", "[XXXXX264]", "[XXXXX265]", "[XXXXX266]", "[XXXXX267]", "[XXXXX268]", "[XXXXX269]", "[XXXXX270]", "[XXXXX271]", "[XXXXX272]", "[XXXXX273]", "[XXXXX274]", "[XXXXX275]", "[XXXXX276]", "[XXXXX277]", "[XXXXX278]", "[XXXXX279]", "[XXXXX280]", "[XXXXX281]", "[XXXXX282]", "[XXXXX283]", "[XXXXX284]", "[XXXXX285]", "[XXXXX286]", "[XXXXX287]", "[XXXXX288]", "[XXXXX289]", "[XXXXX290]", "[XXXXX291]", "[XXXXX292]", "[XXXXX293]", "[XXXXX294]", "[XXXXX295]", "[XXXXX296]", "[XXXXX297]", "[XXXXX298]", "[XXXXX299]", "[XXXXX300]", "[XXXXX301]", "[XXXXX302]", "[XXXXX303]", "[XXXXX304]", "[XXXXX305]", "[XXXXX306]", "[XXXXX307]", "[XXXXX308]", "[XXXXX309]", "[XXXXX310]", "[XXXXX311]", "[XXXXX312]", "[XXXXX313]", "[XXXXX314]", "[XXXXX315]", "[XXXXX316]", "[XXXXX317]", "[XXXXX318]", "[XXXXX319]", "[XXXXX320]", "[XXXXX321]", "[XXXXX322]", "[XXXXX323]", "[XXXXX324]", "[XXXXX325]", "[XXXXX326]", "[XXXXX327]", "[XXXXX328]", "[XXXXX329]", "[XXXXX330]", "[XXXXX331]", "[XXXXX332]", "[XXXXX333]", "[XXXXX334]", "[XXXXX335]", "[XXXXX336]", "[XXXXX337]", "[XXXXX338]", "[XXXXX339]", "[XXXXX340]", "[XXXXX341]", "[XXXXX342]", "[XXXXX343]", "[XXXXX344]", "[XXXXX345]", "[XXXXX346]", "[XXXXX347]", "[XXXXX348]", "[XXXXX349]", "[XXXXX350]", "[XXXXX351]", "[XXXXX352]", "[XXXXX353]", "[XXXXX354]", "[XXXXX355]", "[XXXXX356]", "[XXXXX357]", "[XXXXX358]", "[XXXXX359]", "[XXXXX360]", "[XXXXX361]", "[XXXXX362]", "[XXXXX363]", "[XXXXX364]", "[XXXXX365]", "[XXXXX366]", "[XXXXX367]", "[XXXXX368]", "[XXXXX369]", "[XXXXX370]", "[XXXXX371]", "[XXXXX372]", "[XXXXX373]", "[XXXXX374]", "[XXXXX375]", "[XXXXX376]", "[XXXXX377]", "[XXXXX378]", "[XXXXX379]", "[XXXXX380]", "[XXXXX381]", "[XXXXX382]", "[XXXXX383]", "[XXXXX384]", "[XXXXX385]", "[XXXXX386]", "[XXXXX387]", "[XXXXX388]", "[XXXXX389]", "[XXXXX390]", "[XXXXX391]", "[XXXXX392]", "[XXXXX393]", "[XXXXX394]", "[XXXXX395]", "[XXXXX396]", "[XXXXX397]", "[XXXXX398]", "[XXXXX399]", "[XXXXX400]", "[XXXXX401]", "[XXXXX402]", "[XXXXX403]", "[XXXXX404]", "[XXXXX405]", "[XXXXX406]", "[XXXXX407]", "[XXXXX408]", "[XXXXX409]", "[XXXXX410]", "[XXXXX411]", "[XXXXX412]", "[XXXXX413]", "[XXXXX414]", "[XXXXX415]", "[XXXXX416]", "[XXXXX417]", "[XXXXX418]", "[XXXXX419]", "[XXXXX420]", "[XXXXX421]", "[XXXXX422]", "[XXXXX423]", "[XXXXX424]", "[XXXXX425]", "[XXXXX426]", "[XXXXX427]", "[XXXXX428]", "[XXXXX429]", "[XXXXX430]", "[XXXXX431]", "[XXXXX432]", "[XXXXX433]", "[XXXXX434]", "[XXXXX435]", "[XXXXX436]", "[XXXXX437]", "[XXXXX438]", "[XXXXX439]", "[XXXXX440]", "[XXXXX441]", "[XXXXX442]", "[XXXXX443]", "[XXXXX444]", "[XXXXX445]", "[XXXXX446]", "[XXXXX447]", "[XXXXX448]", "[XXXXX449]", "[XXXXX450]", "[XXXXX451]", "[XXXXX452]", "[XXXXX453]", "[XXXXX454]", "[XXXXX455]", "[XXXXX456]", "[XXXXX457]", "[XXXXX458]", "[XXXXX459]", "[XXXXX460]", "[XXXXX461]", "[XXXXX462]", "[XXXXX463]", "[XXXXX464]", "[XXXXX465]", "[XXXXX466]", "[XXXXX467]", "[XXXXX468]", "[XXXXX469]", "[XXXXX470]", "[XXXXX471]", "[XXXXX472]", "[XXXXX473]", "[XXXXX474]", "[XXXXX475]", "[XXXXX476]", "[XXXXX477]", "[XXXXX478]", "[XXXXX479]", "[XXXXX480]", "[XXXXX481]", "[XXXXX482]", "[XXXXX483]", "[XXXXX484]", "[XXXXX485]", "[XXXXX486]", "[XXXXX487]", "[XXXXX488]", "[XXXXX489]", "[XXXXX490]", "[XXXXX491]", "[XXXXX492]", "[XXXXX493]", "[XXXXX494]", "[XXXXX495]", "[XXXXX496]", "[XXXXX497]", "[XXXXX498]", "[XXXXX499]", "[XXXXX500]", "[XXXXX501]", "[XXXXX502]", "[XXXXX503]", "[XXXXX504]", "[XXXXX505]", "[XXXXX506]", "[XXXXX507]", "[XXXXX508]", "[XXXXX509]", "[XXXXX510]", "[XXXXX511]", "[XXXXX512]", "[XXXXX513]", "[XXXXX514]", "[XXXXX515]", "[XXXXX516]", "[XXXXX517]", "[XXXXX518]", "[XXXXX519]", "[XXXXX520]", "[XXXXX521]", "[XXXXX522]", "[XXXXX523]", "[XXXXX524]", "[XXXXX525]", "[XXXXX526]", "[XXXXX527]", "[XXXXX528]", "[XXXXX529]", "[XXXXX530]", "[XXXXX531]", "[XXXXX532]", "[XXXXX533]", "[XXXXX534]", "[XXXXX535]", "[XXXXX536]", "[XXXXX537]", "[XXXXX538]", "[XXXXX539]", "[XXXXX540]", "[XXXXX541]", "[XXXXX542]", "[XXXXX543]", "[XXXXX544]", "[XXXXX545]", "[XXXXX546]", "[XXXXX547]", "[XXXXX548]", "[XXXXX549]", "[XXXXX550]", "[XXXXX551]", "[XXXXX552]", "[XXXXX553]", "[XXXXX554]", "[XXXXX555]", "[XXXXX556]", "[XXXXX557]", "[XXXXX558]", "[XXXXX559]", "[XXXXX560]", "[XXXXX561]", "[XXXXX562]", "[XXXXX563]", "[XXXXX564]", "[XXXXX565]", "[XXXXX566]", "[XXXXX567]", "[XXXXX568]", "[XXXXX569]", "[XXXXX570]", "[XXXXX571]", "[XXXXX572]", "[XXXXX573]", "[XXXXX574]", "[XXXXX575]", "[XXXXX576]", "[XXXXX577]", "[XXXXX578]", "[XXXXX579]", "[XXXXX580]", "[XXXXX581]", "[XXXXX582]", "[XXXXX583]", "[XXXXX584]", "[XXXXX585]", "[XXXXX586]", "[XXXXX587]", "[XXXXX588]", "[XXXXX589]", "[XXXXX590]", "[XXXXX591]", "[XXXXX592]", "[XXXXX593]", "[XXXXX594]", "[XXXXX595]", "[XXXXX596]", "[XXXXX597]", "[XXXXX598]", "[XXXXX599]", "[XXXXX600]", "[XXXXX601]", "[XXXXX602]", "[XXXXX603]", "[XXXXX604]", "[XXXXX605]", "[XXXXX606]", "[XXXXX607]", "[XXXXX608]", "[XXXXX609]", "[XXXXX610]", "[XXXXX611]", "[XXXXX612]", "[XXXXX613]", "[XXXXX614]", "[XXXXX615]", "[XXXXX616]", "[XXXXX617]", "[XXXXX618]", "[XXXXX619]", "[XXXXX620]", "[XXXXX621]", "[XXXXX622]", "[XXXXX623]", "[XXXXX624]", "[XXXXX625]", "[XXXXX626]", "[XXXXX627]", "[XXXXX628]", "[XXXXX629]", "[XXXXX630]", "[XXXXX631]", "[XXXXX632]", "[XXXXX633]", "[XXXXX634]", "[XXXXX635]", "[XXXXX636]", "[XXXXX637]", "[XXXXX638]", "[XXXXX639]", "[XXXXX640]", "[XXXXX641]", "[XXXXX642]", "[XXXXX643]", "[XXXXX644]", "[XXXXX645]", "[XXXXX646]", "[XXXXX647]", "[XXXXX648]", "[XXXXX649]", "[XXXXX650]", "[XXXXX651]", "[XXXXX652]", "[XXXXX653]", "[XXXXX654]", "[XXXXX655]", "[XXXXX656]", "[XXXXX657]", "[XXXXX658]", "[XXXXX659]", "[XXXXX660]", "[XXXXX661]", "[XXXXX662]", "[XXXXX663]", "[XXXXX664]", "[XXXXX665]", "[XXXXX666]", "[XXXXX667]", "[XXXXX668]", "[XXXXX669]", "[XXXXX670]", "[XXXXX671]", "[XXXXX672]", "[XXXXX673]", "[XXXXX674]", "[XXXXX675]", "[XXXXX676]", "[XXXXX677]", "[XXXXX678]", "[XXXXX679]", "[XXXXX680]", "[XXXXX681]", "[XXXXX682]", "[XXXXX683]", "[XXXXX684]", "[XXXXX685]", "[XXXXX686]", "[XXXXX687]", "[XXXXX688]", "[XXXXX689]", "[XXXXX690]", "[XXXXX691]", "[XXXXX692]", "[XXXXX693]", "[XXXXX694]", "[XXXXX695]", "[XXXXX696]", "[XXXXX697]", "[XXXXX698]", "[XXXXX699]", "[XXXXX700]", "[XXXXX701]", "[XXXXX702]", "[XXXXX703]", "[XXXXX704]", "[XXXXX705]", "[XXXXX706]", "[XXXXX707]", "[XXXXX708]", "[XXXXX709]", "[XXXXX710]", "[XXXXX711]", "[XXXXX712]", "[XXXXX713]", "[XXXXX714]", "[XXXXX715]", "[XXXXX716]", "[XXXXX717]", "[XXXXX718]", "[XXXXX719]", "[XXXXX720]", "[XXXXX721]", "[XXXXX722]", "[XXXXX723]", "[XXXXX724]", "[XXXXX725]", "[XXXXX726]", "[XXXXX727]", "[XXXXX728]", "[XXXXX729]", "[XXXXX730]", "[XXXXX731]", "[XXXXX732]", "[XXXXX733]", "[XXXXX734]", "[XXXXX735]", "[XXXXX736]", "[XXXXX737]", "[XXXXX738]", "[XXXXX739]", "[XXXXX740]", "[XXXXX741]", "[XXXXX742]", "[XXXXX743]", "[XXXXX744]", "[XXXXX745]", "[XXXXX746]", "[XXXXX747]", "[XXXXX748]", "[XXXXX749]", "[XXXXX750]", "[XXXXX751]", "[XXXXX752]", "[XXXXX753]", "[XXXXX754]", "[XXXXX755]", "[XXXXX756]", "[XXXXX757]", "[XXXXX758]", "[XXXXX759]", "[XXXXX760]", "[XXXXX761]", "[XXXXX762]", "[XXXXX763]", "[XXXXX764]"]}
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d20073deff030667202fa9214b9d9dd81c5e3d7af03910207ce324c2fee3c1b
3
+ size 1010636
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "remove_space": true, "keep_accents": true, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "__type": "AddedToken"}, "sp_model_kwargs": {}, "name_or_path": "models/10mb/pcm_latn_10mb", "model_input_names": ["input_ids", "attention_mask"], "special_tokens_map_file": "models/10mb/pcm_latn_10mb/special_tokens_map.json", "tokenizer_class": "AlbertTokenizer"}