sngsng commited on
Commit
082215a
1 Parent(s): 97fe491

Upload 3 files

Browse files
Files changed (3) hide show
  1. added_tokens.json +506 -0
  2. spiece.model +3 -0
  3. training_args.bin +3 -0
added_tokens.json ADDED
@@ -0,0 +1,506 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "3c": 32461,
3
+ "Taigi": 32598,
4
+ "Taiwan": 32590,
5
+ "Taiwanese": 32589,
6
+ "ah": 32328,
7
+ "ai": 32435,
8
+ "bard": 32466,
9
+ "bing": 32155,
10
+ "bái": 32146,
11
+ "chatgpt": 32375,
12
+ "eleven": 32501,
13
+ "excel": 32494,
14
+ "facebook": 32196,
15
+ "fasion": 32551,
16
+ "france": 32507,
17
+ "germany": 32505,
18
+ "google": 32276,
19
+ "gè": 32575,
20
+ "hashtag": 32388,
21
+ "hashtag?": 32584,
22
+ "india": 32502,
23
+ "inspiring": 32549,
24
+ "instagram": 32324,
25
+ "italy": 32500,
26
+ "lo͘": 32452,
27
+ "lài": 32300,
28
+ "mart": 32492,
29
+ "m̀": 32583,
30
+ "m̀?": 32586,
31
+ "o͘": 32202,
32
+ "paintings": 32599,
33
+ "quotes": 32541,
34
+ "seven": 32491,
35
+ "spain": 32498,
36
+ "taigi": 32600,
37
+ "taigi?": 32601,
38
+ "twitter": 32266,
39
+ "tó͘": 32205,
40
+ "youtube": 32350,
41
+ "youtube?": 32585,
42
+ "、": 32481,
43
+ "。": 32560,
44
+ "䆀": 32265,
45
+ "一": 32377,
46
+ "上": 32383,
47
+ "下": 32283,
48
+ "不": 32437,
49
+ "世": 32104,
50
+ "个": 32381,
51
+ "中": 32367,
52
+ "主": 32423,
53
+ "久": 32234,
54
+ "之": 32132,
55
+ "予": 32248,
56
+ "事": 32306,
57
+ "人": 32148,
58
+ "今": 32106,
59
+ "介": 32323,
60
+ "仔": 32209,
61
+ "他": 32530,
62
+ "仝": 32517,
63
+ "代": 32192,
64
+ "件": 32427,
65
+ "伊": 32107,
66
+ "伙": 32152,
67
+ "伴": 32593,
68
+ "佇": 32133,
69
+ "位": 32159,
70
+ "住": 32432,
71
+ "佗": 32414,
72
+ "作": 32519,
73
+ "你": 32116,
74
+ "佮": 32268,
75
+ "使": 32339,
76
+ "來": 32243,
77
+ "便": 32513,
78
+ "俗": 32356,
79
+ "個": 32175,
80
+ "借": 32168,
81
+ "假": 32525,
82
+ "偌": 32250,
83
+ "做": 32351,
84
+ "傷": 32118,
85
+ "像": 32597,
86
+ "價": 32382,
87
+ "儉": 32352,
88
+ "元": 32136,
89
+ "先": 32358,
90
+ "光": 32170,
91
+ "免": 32449,
92
+ "兜": 32439,
93
+ "入": 32406,
94
+ "公": 32296,
95
+ "共": 32478,
96
+ "其": 32506,
97
+ "冊": 32490,
98
+ "再": 32126,
99
+ "凊": 32483,
100
+ "出": 32143,
101
+ "別": 32566,
102
+ "利": 32512,
103
+ "到": 32285,
104
+ "則": 32197,
105
+ "創": 32344,
106
+ "劇": 32221,
107
+ "力": 32368,
108
+ "動": 32556,
109
+ "勞": 32287,
110
+ "勢": 32398,
111
+ "化": 32321,
112
+ "卵": 32121,
113
+ "原": 32476,
114
+ "去": 32445,
115
+ "口": 32464,
116
+ "古": 32325,
117
+ "句": 32291,
118
+ "台": 32373,
119
+ "台灣": 32587,
120
+ "史": 32523,
121
+ "名": 32236,
122
+ "向": 32272,
123
+ "吵": 32105,
124
+ "告": 32261,
125
+ "呢": 32384,
126
+ "味": 32357,
127
+ "呵": 32559,
128
+ "和": 32602,
129
+ "咧": 32330,
130
+ "咱": 32176,
131
+ "咾": 32567,
132
+ "品": 32497,
133
+ "員": 32576,
134
+ "哪": 32302,
135
+ "哲": 32521,
136
+ "哺": 32475,
137
+ "商": 32499,
138
+ "啉": 32144,
139
+ "問": 32190,
140
+ "啥": 32239,
141
+ "啦": 32214,
142
+ "喜": 32141,
143
+ "嘛": 32177,
144
+ "嘿": 32391,
145
+ "器": 32195,
146
+ "四": 32362,
147
+ "回": 32337,
148
+ "囡": 32594,
149
+ "國": 32119,
150
+ "圓": 32109,
151
+ "圖": 32548,
152
+ "地": 32201,
153
+ "埔": 32581,
154
+ "報": 32460,
155
+ "塊": 32216,
156
+ "外": 32348,
157
+ "多": 32369,
158
+ "夜": 32447,
159
+ "夠": 32431,
160
+ "大": 32114,
161
+ "天": 32424,
162
+ "奅": 32568,
163
+ "奶": 32319,
164
+ "好": 32327,
165
+ "娛": 32555,
166
+ "媠": 32139,
167
+ "嫌": 32562,
168
+ "字": 32504,
169
+ "學": 32430,
170
+ "宗": 32531,
171
+ "客": 32264,
172
+ "家": 32426,
173
+ "寒": 32108,
174
+ "寡": 32484,
175
+ "寫": 32207,
176
+ "對": 32112,
177
+ "小": 32188,
178
+ "尚": 32544,
179
+ "就": 32533,
180
+ "山": 32122,
181
+ "島": 32280,
182
+ "峽": 32314,
183
+ "工": 32204,
184
+ "己": 32297,
185
+ "已": 32343,
186
+ "市": 32156,
187
+ "幾": 32134,
188
+ "座": 32436,
189
+ "廳": 32163,
190
+ "建": 32226,
191
+ "彩": 32405,
192
+ "影": 32407,
193
+ "得": 32453,
194
+ "心": 32271,
195
+ "快": 32386,
196
+ "怎": 32394,
197
+ "怪": 32246,
198
+ "恩": 32444,
199
+ "恬": 32194,
200
+ "息": 32408,
201
+ "想": 32286,
202
+ "意": 32187,
203
+ "愛": 32262,
204
+ "感": 32127,
205
+ "懸": 32256,
206
+ "我": 32309,
207
+ "戲": 32582,
208
+ "手": 32338,
209
+ "技": 32336,
210
+ "拍": 32284,
211
+ "招": 32142,
212
+ "按": 32410,
213
+ "捌": 32529,
214
+ "插": 32558,
215
+ "揣": 32292,
216
+ "揤": 32565,
217
+ "搜": 32150,
218
+ "搪": 32293,
219
+ "擺": 32390,
220
+ "攏": 32400,
221
+ "支": 32281,
222
+ "改": 32580,
223
+ "放": 32536,
224
+ "政": 32528,
225
+ "故": 32158,
226
+ "教": 32514,
227
+ "敢": 32355,
228
+ "敲": 32282,
229
+ "數": 32479,
230
+ "文": 32186,
231
+ "料": 32181,
232
+ "新": 32364,
233
+ "旅": 32125,
234
+ "日": 32488,
235
+ "早": 32147,
236
+ "明": 32395,
237
+ "昏": 32140,
238
+ "星": 32577,
239
+ "昨": 32289,
240
+ "是": 32240,
241
+ "時": 32552,
242
+ "晝": 32331,
243
+ "景": 32515,
244
+ "暗": 32129,
245
+ "暝": 32257,
246
+ "曉": 32520,
247
+ "最": 32166,
248
+ "會": 32403,
249
+ "月": 32219,
250
+ "有": 32379,
251
+ "望": 32301,
252
+ "本": 32164,
253
+ "果": 32342,
254
+ "某": 32578,
255
+ "查": 32172,
256
+ "案": 32508,
257
+ "條": 32458,
258
+ "楞": 32135,
259
+ "業": 32455,
260
+ "概": 32295,
261
+ "樂": 32130,
262
+ "機": 32263,
263
+ "檔": 32510,
264
+ "欠": 32182,
265
+ "欲": 32374,
266
+ "款": 32254,
267
+ "歇": 32471,
268
+ "歌": 32378,
269
+ "歐": 32366,
270
+ "歡": 32442,
271
+ "止": 32359,
272
+ "正": 32450,
273
+ "歧": 32315,
274
+ "歷": 32526,
275
+ "歹": 32290,
276
+ "死": 32218,
277
+ "毋": 32277,
278
+ "比": 32571,
279
+ "民": 32259,
280
+ "氣": 32210,
281
+ "水": 32333,
282
+ "求": 32495,
283
+ "池": 32365,
284
+ "沛": 32260,
285
+ "治": 32527,
286
+ "法": 32173,
287
+ "注": 32311,
288
+ "洲": 32467,
289
+ "活": 32572,
290
+ "流": 32543,
291
+ "海": 32433,
292
+ "消": 32227,
293
+ "涼": 32396,
294
+ "添": 32131,
295
+ "港": 32477,
296
+ "湯": 32547,
297
+ "滷": 32425,
298
+ "演": 32579,
299
+ "濟": 32422,
300
+ "灣": 32269,
301
+ "無": 32318,
302
+ "然": 32294,
303
+ "煞": 32222,
304
+ "熱": 32100,
305
+ "燒": 32247,
306
+ "爾": 32103,
307
+ "片": 32485,
308
+ "物": 32255,
309
+ "特": 32569,
310
+ "狗": 32596,
311
+ "猶": 32278,
312
+ "玉": 32415,
313
+ "理": 32545,
314
+ "甜": 32326,
315
+ "生": 32229,
316
+ "產": 32419,
317
+ "用": 32310,
318
+ "甲": 32474,
319
+ "界": 32487,
320
+ "畫": 32542,
321
+ "當": 32409,
322
+ "發": 32335,
323
+ "的": 32241,
324
+ "盒": 32165,
325
+ "相": 32380,
326
+ "看": 32151,
327
+ "真": 32230,
328
+ "着": 32179,
329
+ "矣": 32370,
330
+ "知": 32189,
331
+ "神": 32537,
332
+ "科": 32361,
333
+ "種": 32223,
334
+ "穩": 32371,
335
+ "空": 32123,
336
+ "穿": 32570,
337
+ "站": 32203,
338
+ "章": 32110,
339
+ "笑": 32411,
340
+ "箍": 32329,
341
+ "節": 32354,
342
+ "篇": 32145,
343
+ "築": 32561,
344
+ "米": 32316,
345
+ "粉": 32341,
346
+ "糕": 32443,
347
+ "約": 32509,
348
+ "細": 32451,
349
+ "紹": 32457,
350
+ "組": 32489,
351
+ "絞": 32307,
352
+ "絲": 32217,
353
+ "經": 32413,
354
+ "網": 32493,
355
+ "緊": 32267,
356
+ "緻": 32532,
357
+ "總": 32518,
358
+ "續": 32345,
359
+ "罔": 32469,
360
+ "罕": 32317,
361
+ "美": 32298,
362
+ "翕": 32524,
363
+ "翻": 32191,
364
+ "聞": 32249,
365
+ "聽": 32161,
366
+ "肉": 32397,
367
+ "育": 32535,
368
+ "能": 32120,
369
+ "膩": 32470,
370
+ "臺": 32313,
371
+ "臺灣": 32588,
372
+ "舞": 32252,
373
+ "花": 32553,
374
+ "芳": 32332,
375
+ "若": 32421,
376
+ "英": 32299,
377
+ "茶": 32160,
378
+ "莫": 32128,
379
+ "菜": 32233,
380
+ "落": 32462,
381
+ "著": 32353,
382
+ "蓋": 32237,
383
+ "蔬": 32275,
384
+ "藝": 32557,
385
+ "螺": 32456,
386
+ "行": 32167,
387
+ "術": 32540,
388
+ "衝": 32392,
389
+ "袂": 32385,
390
+ "要": 32198,
391
+ "見": 32459,
392
+ "覓": 32401,
393
+ "視": 32303,
394
+ "觀": 32157,
395
+ "言": 32153,
396
+ "記": 32200,
397
+ "試": 32468,
398
+ "詩": 32215,
399
+ "話": 32111,
400
+ "詼": 32312,
401
+ "誌": 32363,
402
+ "語": 32446,
403
+ "誠": 32274,
404
+ "說": 32402,
405
+ "請": 32270,
406
+ "論": 32184,
407
+ "講": 32273,
408
+ "謝": 32463,
409
+ "譯": 32349,
410
+ "議": 32412,
411
+ "讚": 32231,
412
+ "豐": 32225,
413
+ "貓": 32595,
414
+ "財": 32546,
415
+ "買": 32346,
416
+ "資": 32211,
417
+ "賢": 32232,
418
+ "賣": 32101,
419
+ "賽": 32564,
420
+ "起": 32183,
421
+ "超": 32503,
422
+ "趖": 32522,
423
+ "趣": 32441,
424
+ "足": 32429,
425
+ "路": 32238,
426
+ "踅": 32308,
427
+ "蹛": 32138,
428
+ "軍": 32454,
429
+ "較": 32154,
430
+ "載": 32304,
431
+ "輕": 32117,
432
+ "迌": 32574,
433
+ "近": 32417,
434
+ "透": 32224,
435
+ "逐": 32245,
436
+ "這": 32115,
437
+ "通": 32199,
438
+ "逝": 32149,
439
+ "造": 32288,
440
+ "連": 32399,
441
+ "進": 32169,
442
+ "遊": 32171,
443
+ "運": 32539,
444
+ "過": 32438,
445
+ "達": 32228,
446
+ "適": 32440,
447
+ "遮": 32178,
448
+ "酒": 32473,
449
+ "酥": 32372,
450
+ "醉": 32404,
451
+ "重": 32162,
452
+ "量": 32496,
453
+ "錐": 32591,
454
+ "錢": 32389,
455
+ "鎮": 32258,
456
+ "鑠": 32563,
457
+ "閒": 32480,
458
+ "間": 32554,
459
+ "閣": 32418,
460
+ "關": 32420,
461
+ "阮": 32174,
462
+ "隊": 32387,
463
+ "際": 32486,
464
+ "隻": 32516,
465
+ "雄": 32360,
466
+ "雖": 32180,
467
+ "雞": 32434,
468
+ "雨": 32416,
469
+ "雷": 32220,
470
+ "電": 32253,
471
+ "霆": 32340,
472
+ "面": 32347,
473
+ "韓": 32465,
474
+ "音": 32235,
475
+ "頁": 32511,
476
+ "頓": 32279,
477
+ "頭": 32137,
478
+ "題": 32208,
479
+ "類": 32102,
480
+ "風": 32472,
481
+ "食": 32322,
482
+ "飯": 32482,
483
+ "飽": 32124,
484
+ "餐": 32113,
485
+ "館": 32550,
486
+ "馬": 32428,
487
+ "驚": 32320,
488
+ "骨": 32448,
489
+ "體": 32534,
490
+ "鬆": 32376,
491
+ "鬥": 32393,
492
+ "鬼": 32193,
493
+ "鮮": 32206,
494
+ "鹹": 32244,
495
+ "麗": 32251,
496
+ "點": 32185,
497
+ "鼓": 32538,
498
+ "齣": 32334,
499
+ "龜": 32592,
500
+ "!": 32212,
501
+ ",": 32603,
502
+ ".": 32242,
503
+ ":": 32305,
504
+ "?": 32213,
505
+ "𨑨": 32573
506
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68d169ee298a3f9179ae519a9fedecd8cd16dbe54f1317153b733af3cb29141b
3
+ size 3771