floriangardin commited on
Commit
8593e68
1 Parent(s): 6f348d6

Upload tokenizer

Browse files
Files changed (4) hide show
  1. added_tokens.json +1 -1
  2. merges.txt +0 -561
  3. tokenizer.json +3 -1126
  4. vocab.json +1 -1
added_tokens.json CHANGED
@@ -1,3 +1,3 @@
1
  {
2
- "<|endoftext|>": 821
3
  }
 
1
  {
2
+ "<|endoftext|>": 260
3
  }
merges.txt CHANGED
@@ -1,562 +1 @@
1
  #version: 0.2
2
- ) .
3
- ( -
4
- _ _
5
- m p
6
- n o
7
- p i
8
- a no
9
- pi ano
10
- ) +
11
- p p
12
- ) (
13
- )+ (
14
- I I
15
- e d
16
- ' ]
17
- [ '
18
- '] %
19
- q d
20
- s d
21
- f f
22
- e n
23
- r a
24
- a u
25
- f ra
26
- g m
27
- en t
28
- au gm
29
- fra c
30
- augm ent
31
- r i
32
- V II
33
- h t
34
- b ri
35
- g ht
36
- bri ght
37
- I V
38
- ) ,
39
- 1 1
40
- h d
41
- 1 0
42
- V I
43
- II I
44
- ) ).
45
- ) )+
46
- ff f
47
- 2 4
48
- )( )+(
49
- s u
50
- o n
51
- 6 4
52
- b a
53
- s a
54
- sa x
55
- 2 1
56
- ) )+(
57
- 6 5
58
- t e
59
- pp p
60
- w d
61
- t r
62
- 4 3
63
- o l
64
- s s
65
- e t
66
- a r
67
- o r
68
- on e
69
- ba ss
70
- t i
71
- h or
72
- hor n
73
- e l
74
- i ol
75
- v iol
76
- m b
77
- 5 6
78
- u mp
79
- tr ump
80
- trump et
81
- g u
82
- i t
83
- gu it
84
- guit ar
85
- t o
86
- o mb
87
- tr omb
88
- tromb one
89
- 4 0
90
- i s
91
- ri n
92
- 1 2
93
- c h
94
- no r
95
- te nor
96
- 1 3
97
- a l
98
- al to
99
- i n
100
- 1 5
101
- o p
102
- r ano
103
- s op
104
- sop rano
105
- a n
106
- g l
107
- h ar
108
- har p
109
- c el
110
- en gl
111
- is h
112
- engl ish
113
- f r
114
- t u
115
- tu ba
116
- b o
117
- t one
118
- ri tone
119
- ba ritone
120
- l o
121
- o bo
122
- obo e
123
- c c
124
- cel lo
125
- c l
126
- a rin
127
- viol in
128
- en ch
129
- fr ench
130
- pi cc
131
- ol o
132
- picc olo
133
- o on
134
- bass oon
135
- cl arin
136
- clarin et
137
- d r
138
- m s
139
- u ms
140
- dr ums
141
- viol a
142
- f l
143
- u te
144
- fl ute
145
- c on
146
- t ra
147
- con tra
148
- contra bass
149
- mp an
150
- ti mpan
151
- timpan i
152
- 3 5
153
- ) ),
154
- s e
155
- 1 4
156
- ti on
157
- s te
158
- ste el
159
- 1 6
160
- ) <
161
- d o
162
- f te
163
- x t
164
- | >
165
- en do
166
- )< |
167
- fte xt
168
- endo ftext
169
- |> (
170
- 1 7
171
- a c
172
- o u
173
- s ti
174
- ac ou
175
- sti c
176
- acou stic
177
- a d
178
- { -
179
- l e
180
- } ']%
181
- 3 0
182
- 4 2
183
- 1 8
184
- s t
185
- 3 2
186
- b ra
187
- bra ss
188
- ad d
189
- en se
190
- mb le
191
- rin g
192
- st ring
193
- ense mble
194
- c tion
195
- se ction
196
- ) ']%
197
- d is
198
- t or
199
- dis tor
200
- distor tion
201
- 1 9
202
- h h
203
- 2 0
204
- 2 2
205
- ( +
206
- (+ )']%
207
- ] {-
208
- 2 3
209
- s n
210
- 2 5
211
- i c
212
- a to
213
- z z
214
- pi zz
215
- ic ato
216
- pizz icato
217
- b d
218
- c t
219
- e ct
220
- ri c
221
- el ect
222
- elect ric
223
- 2 7
224
- 2 6
225
- i r
226
- o ir
227
- ch oir
228
- h s
229
- a a
230
- aa hs
231
- e r
232
- t d
233
- 2 8
234
- 2 9
235
- m m
236
- ) ))+(
237
- 3 1
238
- o c
239
- f in
240
- g er
241
- fin ger
242
- g an
243
- or gan
244
- 3 3
245
- oc k
246
- [' (+)']%
247
- j o
248
- n jo
249
- ba njo
250
- p ad
251
- 3 4
252
- ] ']%
253
- r ock
254
- 3 7
255
- 3 9
256
- 4 1
257
- 4 4
258
- r s
259
- 8 4
260
- 6 9
261
- )( )<|
262
- 3 6
263
- w ar
264
- war m
265
- et le
266
- fr etle
267
- fretle ss
268
- 5 3
269
- [' [
270
- m ba
271
- 4 5
272
- a ri
273
- m ari
274
- mari mba
275
- 4 7
276
- g pi
277
- p e
278
- ba gpi
279
- bagpi pe
280
- ) )<|
281
- 4 8
282
- 3 8
283
- ] [
284
- e st
285
- cel est
286
- celest a
287
- f i
288
- t h
289
- c p
290
- 16 8
291
- 5 2
292
- f x
293
- e an
294
- cl ean
295
- 4 9
296
- arin a
297
- oc arina
298
- 4 6
299
- o h
300
- 6 0
301
- c i
302
- s ci
303
- 5 1
304
- a cc
305
- d i
306
- or di
307
- acc ordi
308
- accordi on
309
- 5 0
310
- 5 4
311
- n th
312
- s y
313
- sy nth
314
- 5 5
315
- 5 9
316
- le ad
317
- v er
318
- on k
319
- r ch
320
- u rch
321
- ch urch
322
- 12 0
323
- d ri
324
- o ver
325
- v en
326
- dri ven
327
- over driven
328
- 7 0
329
- } {-
330
- 7 3
331
- b t
332
- 6 1
333
- n e
334
- 8 7
335
- 8 0
336
- a p
337
- l ap
338
- s lap
339
- a g
340
- d d
341
- o ic
342
- v oic
343
- fi dd
344
- ne w
345
- ag e
346
- voic e
347
- fidd le
348
- 8 3
349
- h onk
350
- s pi
351
- t onk
352
- en spi
353
- gl ock
354
- honk y
355
- enspi el
356
- glock enspiel
357
- 6 7
358
- o th
359
- w to
360
- sa wto
361
- sawto oth
362
- 8 1
363
- 7 7
364
- m t
365
- 5 7
366
- 10 1
367
- 10 9
368
- 7 9
369
- 11 2
370
- 8 9
371
- 6 2
372
- 11 3
373
- 1 40
374
- l t
375
- 7 1
376
- 10 3
377
- 9 7
378
- b lo
379
- t t
380
- w n
381
- bo tt
382
- blo wn
383
- bott le
384
- 9 5
385
- 11 5
386
- 15 1
387
- 8 5
388
- 28 0
389
- 13 7
390
- 1 43
391
- 24 0
392
- 9 1
393
- 12 5
394
- 24 1
395
- 1 21
396
- 9 2
397
- 11 6
398
- 12 3
399
- 18 7
400
- a t
401
- h er
402
- m o
403
- p her
404
- s pher
405
- 12 7
406
- 13 1
407
- 22 9
408
- at mo
409
- spher e
410
- atmo sphere
411
- 6 3
412
- 8 2
413
- 11 9
414
- 17 3
415
- 22 3
416
- 17 9
417
- 9 3
418
- 12 9
419
- 8 40
420
- 10 5
421
- 29 3
422
- a ra
423
- n g
424
- bright ne
425
- ch ara
426
- brightne ss
427
- chara ng
428
- 11 7
429
- 13 9
430
- 16 9
431
- ) ))<|
432
- 16 7
433
- 18 5
434
- 13 3
435
- 15 7
436
- 18 1
437
- 3 65
438
- m u
439
- t ed
440
- mu ted
441
- 2 10
442
- 2 21
443
- 7 6
444
- o o
445
- 19 9
446
- oo hs
447
- c y
448
- e ver
449
- r ever
450
- 20 7
451
- 28 9
452
- 33 6
453
- mba l
454
- 109 4
455
- cy mbal
456
- rever se
457
- 19 7
458
- 10 7
459
- 14 7
460
- 9 9
461
- 7 5
462
- 15 3
463
- 25 7
464
- 28 1
465
- 38 9
466
- 2 11
467
- 5 29
468
- 5 53
469
- 6 8
470
- 10 87
471
- 21 3
472
- 19 1
473
- 20 9
474
- 27 1
475
- 29 5
476
- 46 7
477
- 3 43
478
- 7 19
479
- 7 37
480
- 8 43
481
- 9 17
482
- 24 7
483
- 43 7
484
- 40 9
485
- 12 8
486
- 35 9
487
- 14 5
488
- 20 5
489
- 29 7
490
- 37 1
491
- 39 1
492
- 69 7
493
- 45 1
494
- 67 1
495
- 67 9
496
- 3 19
497
- 6 23
498
- 6 69
499
- 7 33
500
- 7 67
501
- 7 57
502
- 8 11
503
- 8 83
504
- 9 13
505
- 9 35
506
- 24 3
507
- 21 2
508
- 21 7
509
- 56 0
510
- 56 9
511
- 15 2
512
- 15 5
513
- 15 21
514
- 16 1
515
- 16 3
516
- 16 27
517
- 17 7
518
- 18 6
519
- 32 3
520
- 32 7
521
- 25 5
522
- 26 3
523
- 26 8
524
- 33 4
525
- 34 5
526
- 39 2
527
- 39 9
528
- 69 5
529
- 69 9
530
- 47 5
531
- 48 9
532
- 49 1
533
- 59 1
534
- 70 5
535
- 80 1
536
- 365 3
537
- 99 43
538
- 14 9
539
- 9 22
540
- 15 9
541
- b l
542
- o bl
543
- in s
544
- gl obl
545
- 19 3
546
- 37 7
547
- globl ins
548
- 5 8
549
- 22 7
550
- 46 3
551
- 2 35
552
- 3 11
553
- 11 1
554
- 14 1
555
- 14 8
556
- 16 91
557
- 17 0
558
- 42 2
559
- 18 8
560
- 20 1
561
- 26 9
562
- 48 1
 
1
  #version: 0.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer.json CHANGED
@@ -4,7 +4,7 @@
4
  "padding": null,
5
  "added_tokens": [
6
  {
7
- "id": 821,
8
  "content": "<|endoftext|>",
9
  "single_word": false,
10
  "lstrip": false,
@@ -300,1131 +300,8 @@
300
  "ŀ": 256,
301
  "Ł": 257,
302
  "ł": 258,
303
- "Ń": 259,
304
- ").": 260,
305
- "(-": 261,
306
- "__": 262,
307
- "mp": 263,
308
- "no": 264,
309
- "pi": 265,
310
- "ano": 266,
311
- "piano": 267,
312
- ")+": 268,
313
- "pp": 269,
314
- ")(": 270,
315
- ")+(": 271,
316
- "II": 272,
317
- "ed": 273,
318
- "']": 274,
319
- "['": 275,
320
- "']%": 276,
321
- "qd": 277,
322
- "sd": 278,
323
- "ff": 279,
324
- "en": 280,
325
- "ra": 281,
326
- "au": 282,
327
- "fra": 283,
328
- "gm": 284,
329
- "ent": 285,
330
- "augm": 286,
331
- "frac": 287,
332
- "augment": 288,
333
- "ri": 289,
334
- "VII": 290,
335
- "ht": 291,
336
- "bri": 292,
337
- "ght": 293,
338
- "bright": 294,
339
- "IV": 295,
340
- "),": 296,
341
- "11": 297,
342
- "hd": 298,
343
- "10": 299,
344
- "VI": 300,
345
- "III": 301,
346
- ")).": 302,
347
- "))+": 303,
348
- "fff": 304,
349
- "24": 305,
350
- ")()+(": 306,
351
- "su": 307,
352
- "on": 308,
353
- "64": 309,
354
- "ba": 310,
355
- "sa": 311,
356
- "sax": 312,
357
- "21": 313,
358
- "))+(": 314,
359
- "65": 315,
360
- "te": 316,
361
- "ppp": 317,
362
- "wd": 318,
363
- "tr": 319,
364
- "43": 320,
365
- "ol": 321,
366
- "ss": 322,
367
- "et": 323,
368
- "ar": 324,
369
- "or": 325,
370
- "one": 326,
371
- "bass": 327,
372
- "ti": 328,
373
- "hor": 329,
374
- "horn": 330,
375
- "el": 331,
376
- "iol": 332,
377
- "viol": 333,
378
- "mb": 334,
379
- "56": 335,
380
- "ump": 336,
381
- "trump": 337,
382
- "trumpet": 338,
383
- "gu": 339,
384
- "it": 340,
385
- "guit": 341,
386
- "guitar": 342,
387
- "to": 343,
388
- "omb": 344,
389
- "tromb": 345,
390
- "trombone": 346,
391
- "40": 347,
392
- "is": 348,
393
- "rin": 349,
394
- "12": 350,
395
- "ch": 351,
396
- "nor": 352,
397
- "tenor": 353,
398
- "13": 354,
399
- "al": 355,
400
- "alto": 356,
401
- "in": 357,
402
- "15": 358,
403
- "op": 359,
404
- "rano": 360,
405
- "sop": 361,
406
- "soprano": 362,
407
- "an": 363,
408
- "gl": 364,
409
- "har": 365,
410
- "harp": 366,
411
- "cel": 367,
412
- "engl": 368,
413
- "ish": 369,
414
- "english": 370,
415
- "fr": 371,
416
- "tu": 372,
417
- "tuba": 373,
418
- "bo": 374,
419
- "tone": 375,
420
- "ritone": 376,
421
- "baritone": 377,
422
- "lo": 378,
423
- "obo": 379,
424
- "oboe": 380,
425
- "cc": 381,
426
- "cello": 382,
427
- "cl": 383,
428
- "arin": 384,
429
- "violin": 385,
430
- "ench": 386,
431
- "french": 387,
432
- "picc": 388,
433
- "olo": 389,
434
- "piccolo": 390,
435
- "oon": 391,
436
- "bassoon": 392,
437
- "clarin": 393,
438
- "clarinet": 394,
439
- "dr": 395,
440
- "ms": 396,
441
- "ums": 397,
442
- "drums": 398,
443
- "viola": 399,
444
- "fl": 400,
445
- "ute": 401,
446
- "flute": 402,
447
- "con": 403,
448
- "tra": 404,
449
- "contra": 405,
450
- "contrabass": 406,
451
- "mpan": 407,
452
- "timpan": 408,
453
- "timpani": 409,
454
- "35": 410,
455
- ")),": 411,
456
- "se": 412,
457
- "14": 413,
458
- "tion": 414,
459
- "ste": 415,
460
- "steel": 416,
461
- "16": 417,
462
- ")<": 418,
463
- "do": 419,
464
- "fte": 420,
465
- "xt": 421,
466
- "|>": 422,
467
- "endo": 423,
468
- ")<|": 424,
469
- "ftext": 425,
470
- "endoftext": 426,
471
- "|>(": 427,
472
- "17": 428,
473
- "ac": 429,
474
- "ou": 430,
475
- "sti": 431,
476
- "acou": 432,
477
- "stic": 433,
478
- "acoustic": 434,
479
- "ad": 435,
480
- "{-": 436,
481
- "le": 437,
482
- "}']%": 438,
483
- "30": 439,
484
- "42": 440,
485
- "18": 441,
486
- "st": 442,
487
- "32": 443,
488
- "bra": 444,
489
- "brass": 445,
490
- "add": 446,
491
- "ense": 447,
492
- "mble": 448,
493
- "ring": 449,
494
- "string": 450,
495
- "ensemble": 451,
496
- "ction": 452,
497
- "section": 453,
498
- ")']%": 454,
499
- "dis": 455,
500
- "tor": 456,
501
- "distor": 457,
502
- "distortion": 458,
503
- "19": 459,
504
- "hh": 460,
505
- "20": 461,
506
- "22": 462,
507
- "(+": 463,
508
- "(+)']%": 464,
509
- "]{-": 465,
510
- "23": 466,
511
- "sn": 467,
512
- "25": 468,
513
- "ic": 469,
514
- "ato": 470,
515
- "zz": 471,
516
- "pizz": 472,
517
- "icato": 473,
518
- "pizzicato": 474,
519
- "bd": 475,
520
- "ct": 476,
521
- "ect": 477,
522
- "ric": 478,
523
- "elect": 479,
524
- "electric": 480,
525
- "27": 481,
526
- "26": 482,
527
- "ir": 483,
528
- "oir": 484,
529
- "choir": 485,
530
- "hs": 486,
531
- "aa": 487,
532
- "aahs": 488,
533
- "er": 489,
534
- "td": 490,
535
- "28": 491,
536
- "29": 492,
537
- "mm": 493,
538
- ")))+(": 494,
539
- "31": 495,
540
- "oc": 496,
541
- "fin": 497,
542
- "ger": 498,
543
- "finger": 499,
544
- "gan": 500,
545
- "organ": 501,
546
- "33": 502,
547
- "ock": 503,
548
- "['(+)']%": 504,
549
- "jo": 505,
550
- "njo": 506,
551
- "banjo": 507,
552
- "pad": 508,
553
- "34": 509,
554
- "]']%": 510,
555
- "rock": 511,
556
- "37": 512,
557
- "39": 513,
558
- "41": 514,
559
- "44": 515,
560
- "rs": 516,
561
- "84": 517,
562
- "69": 518,
563
- ")()<|": 519,
564
- "36": 520,
565
- "war": 521,
566
- "warm": 522,
567
- "etle": 523,
568
- "fretle": 524,
569
- "fretless": 525,
570
- "53": 526,
571
- "['[": 527,
572
- "mba": 528,
573
- "45": 529,
574
- "ari": 530,
575
- "mari": 531,
576
- "marimba": 532,
577
- "47": 533,
578
- "gpi": 534,
579
- "pe": 535,
580
- "bagpi": 536,
581
- "bagpipe": 537,
582
- "))<|": 538,
583
- "48": 539,
584
- "38": 540,
585
- "][": 541,
586
- "est": 542,
587
- "celest": 543,
588
- "celesta": 544,
589
- "fi": 545,
590
- "th": 546,
591
- "cp": 547,
592
- "168": 548,
593
- "52": 549,
594
- "fx": 550,
595
- "ean": 551,
596
- "clean": 552,
597
- "49": 553,
598
- "arina": 554,
599
- "ocarina": 555,
600
- "46": 556,
601
- "oh": 557,
602
- "60": 558,
603
- "ci": 559,
604
- "sci": 560,
605
- "51": 561,
606
- "acc": 562,
607
- "di": 563,
608
- "ordi": 564,
609
- "accordi": 565,
610
- "accordion": 566,
611
- "50": 567,
612
- "54": 568,
613
- "nth": 569,
614
- "sy": 570,
615
- "synth": 571,
616
- "55": 572,
617
- "59": 573,
618
- "lead": 574,
619
- "ver": 575,
620
- "onk": 576,
621
- "rch": 577,
622
- "urch": 578,
623
- "church": 579,
624
- "120": 580,
625
- "dri": 581,
626
- "over": 582,
627
- "ven": 583,
628
- "driven": 584,
629
- "overdriven": 585,
630
- "70": 586,
631
- "}{-": 587,
632
- "73": 588,
633
- "bt": 589,
634
- "61": 590,
635
- "ne": 591,
636
- "87": 592,
637
- "80": 593,
638
- "ap": 594,
639
- "lap": 595,
640
- "slap": 596,
641
- "ag": 597,
642
- "dd": 598,
643
- "oic": 599,
644
- "voic": 600,
645
- "fidd": 601,
646
- "new": 602,
647
- "age": 603,
648
- "voice": 604,
649
- "fiddle": 605,
650
- "83": 606,
651
- "honk": 607,
652
- "spi": 608,
653
- "tonk": 609,
654
- "enspi": 610,
655
- "glock": 611,
656
- "honky": 612,
657
- "enspiel": 613,
658
- "glockenspiel": 614,
659
- "67": 615,
660
- "oth": 616,
661
- "wto": 617,
662
- "sawto": 618,
663
- "sawtooth": 619,
664
- "81": 620,
665
- "77": 621,
666
- "mt": 622,
667
- "57": 623,
668
- "101": 624,
669
- "109": 625,
670
- "79": 626,
671
- "112": 627,
672
- "89": 628,
673
- "62": 629,
674
- "113": 630,
675
- "140": 631,
676
- "lt": 632,
677
- "71": 633,
678
- "103": 634,
679
- "97": 635,
680
- "blo": 636,
681
- "tt": 637,
682
- "wn": 638,
683
- "bott": 639,
684
- "blown": 640,
685
- "bottle": 641,
686
- "95": 642,
687
- "115": 643,
688
- "151": 644,
689
- "85": 645,
690
- "280": 646,
691
- "137": 647,
692
- "143": 648,
693
- "240": 649,
694
- "91": 650,
695
- "125": 651,
696
- "241": 652,
697
- "121": 653,
698
- "92": 654,
699
- "116": 655,
700
- "123": 656,
701
- "187": 657,
702
- "at": 658,
703
- "her": 659,
704
- "mo": 660,
705
- "pher": 661,
706
- "spher": 662,
707
- "127": 663,
708
- "131": 664,
709
- "229": 665,
710
- "atmo": 666,
711
- "sphere": 667,
712
- "atmosphere": 668,
713
- "63": 669,
714
- "82": 670,
715
- "119": 671,
716
- "173": 672,
717
- "223": 673,
718
- "179": 674,
719
- "93": 675,
720
- "129": 676,
721
- "840": 677,
722
- "105": 678,
723
- "293": 679,
724
- "ara": 680,
725
- "ng": 681,
726
- "brightne": 682,
727
- "chara": 683,
728
- "brightness": 684,
729
- "charang": 685,
730
- "117": 686,
731
- "139": 687,
732
- "169": 688,
733
- ")))<|": 689,
734
- "167": 690,
735
- "185": 691,
736
- "133": 692,
737
- "157": 693,
738
- "181": 694,
739
- "365": 695,
740
- "mu": 696,
741
- "ted": 697,
742
- "muted": 698,
743
- "210": 699,
744
- "221": 700,
745
- "76": 701,
746
- "oo": 702,
747
- "199": 703,
748
- "oohs": 704,
749
- "cy": 705,
750
- "ever": 706,
751
- "rever": 707,
752
- "207": 708,
753
- "289": 709,
754
- "336": 710,
755
- "mbal": 711,
756
- "1094": 712,
757
- "cymbal": 713,
758
- "reverse": 714,
759
- "197": 715,
760
- "107": 716,
761
- "147": 717,
762
- "99": 718,
763
- "75": 719,
764
- "153": 720,
765
- "257": 721,
766
- "281": 722,
767
- "389": 723,
768
- "211": 724,
769
- "529": 725,
770
- "553": 726,
771
- "68": 727,
772
- "1087": 728,
773
- "213": 729,
774
- "191": 730,
775
- "209": 731,
776
- "271": 732,
777
- "295": 733,
778
- "467": 734,
779
- "343": 735,
780
- "719": 736,
781
- "737": 737,
782
- "843": 738,
783
- "917": 739,
784
- "247": 740,
785
- "437": 741,
786
- "409": 742,
787
- "128": 743,
788
- "359": 744,
789
- "145": 745,
790
- "205": 746,
791
- "297": 747,
792
- "371": 748,
793
- "391": 749,
794
- "697": 750,
795
- "451": 751,
796
- "671": 752,
797
- "679": 753,
798
- "319": 754,
799
- "623": 755,
800
- "669": 756,
801
- "733": 757,
802
- "767": 758,
803
- "757": 759,
804
- "811": 760,
805
- "883": 761,
806
- "913": 762,
807
- "935": 763,
808
- "243": 764,
809
- "212": 765,
810
- "217": 766,
811
- "560": 767,
812
- "569": 768,
813
- "152": 769,
814
- "155": 770,
815
- "1521": 771,
816
- "161": 772,
817
- "163": 773,
818
- "1627": 774,
819
- "177": 775,
820
- "186": 776,
821
- "323": 777,
822
- "327": 778,
823
- "255": 779,
824
- "263": 780,
825
- "268": 781,
826
- "334": 782,
827
- "345": 783,
828
- "392": 784,
829
- "399": 785,
830
- "695": 786,
831
- "699": 787,
832
- "475": 788,
833
- "489": 789,
834
- "491": 790,
835
- "591": 791,
836
- "705": 792,
837
- "801": 793,
838
- "3653": 794,
839
- "9943": 795,
840
- "149": 796,
841
- "922": 797,
842
- "159": 798,
843
- "bl": 799,
844
- "obl": 800,
845
- "ins": 801,
846
- "globl": 802,
847
- "193": 803,
848
- "377": 804,
849
- "globlins": 805,
850
- "58": 806,
851
- "227": 807,
852
- "463": 808,
853
- "235": 809,
854
- "311": 810,
855
- "111": 811,
856
- "141": 812,
857
- "148": 813,
858
- "1691": 814,
859
- "170": 815,
860
- "422": 816,
861
- "188": 817,
862
- "201": 818,
863
- "269": 819,
864
- "481": 820
865
  },
866
- "merges": [
867
- ") .",
868
- "( -",
869
- "_ _",
870
- "m p",
871
- "n o",
872
- "p i",
873
- "a no",
874
- "pi ano",
875
- ") +",
876
- "p p",
877
- ") (",
878
- ")+ (",
879
- "I I",
880
- "e d",
881
- "' ]",
882
- "[ '",
883
- "'] %",
884
- "q d",
885
- "s d",
886
- "f f",
887
- "e n",
888
- "r a",
889
- "a u",
890
- "f ra",
891
- "g m",
892
- "en t",
893
- "au gm",
894
- "fra c",
895
- "augm ent",
896
- "r i",
897
- "V II",
898
- "h t",
899
- "b ri",
900
- "g ht",
901
- "bri ght",
902
- "I V",
903
- ") ,",
904
- "1 1",
905
- "h d",
906
- "1 0",
907
- "V I",
908
- "II I",
909
- ") ).",
910
- ") )+",
911
- "ff f",
912
- "2 4",
913
- ")( )+(",
914
- "s u",
915
- "o n",
916
- "6 4",
917
- "b a",
918
- "s a",
919
- "sa x",
920
- "2 1",
921
- ") )+(",
922
- "6 5",
923
- "t e",
924
- "pp p",
925
- "w d",
926
- "t r",
927
- "4 3",
928
- "o l",
929
- "s s",
930
- "e t",
931
- "a r",
932
- "o r",
933
- "on e",
934
- "ba ss",
935
- "t i",
936
- "h or",
937
- "hor n",
938
- "e l",
939
- "i ol",
940
- "v iol",
941
- "m b",
942
- "5 6",
943
- "u mp",
944
- "tr ump",
945
- "trump et",
946
- "g u",
947
- "i t",
948
- "gu it",
949
- "guit ar",
950
- "t o",
951
- "o mb",
952
- "tr omb",
953
- "tromb one",
954
- "4 0",
955
- "i s",
956
- "ri n",
957
- "1 2",
958
- "c h",
959
- "no r",
960
- "te nor",
961
- "1 3",
962
- "a l",
963
- "al to",
964
- "i n",
965
- "1 5",
966
- "o p",
967
- "r ano",
968
- "s op",
969
- "sop rano",
970
- "a n",
971
- "g l",
972
- "h ar",
973
- "har p",
974
- "c el",
975
- "en gl",
976
- "is h",
977
- "engl ish",
978
- "f r",
979
- "t u",
980
- "tu ba",
981
- "b o",
982
- "t one",
983
- "ri tone",
984
- "ba ritone",
985
- "l o",
986
- "o bo",
987
- "obo e",
988
- "c c",
989
- "cel lo",
990
- "c l",
991
- "a rin",
992
- "viol in",
993
- "en ch",
994
- "fr ench",
995
- "pi cc",
996
- "ol o",
997
- "picc olo",
998
- "o on",
999
- "bass oon",
1000
- "cl arin",
1001
- "clarin et",
1002
- "d r",
1003
- "m s",
1004
- "u ms",
1005
- "dr ums",
1006
- "viol a",
1007
- "f l",
1008
- "u te",
1009
- "fl ute",
1010
- "c on",
1011
- "t ra",
1012
- "con tra",
1013
- "contra bass",
1014
- "mp an",
1015
- "ti mpan",
1016
- "timpan i",
1017
- "3 5",
1018
- ") ),",
1019
- "s e",
1020
- "1 4",
1021
- "ti on",
1022
- "s te",
1023
- "ste el",
1024
- "1 6",
1025
- ") <",
1026
- "d o",
1027
- "f te",
1028
- "x t",
1029
- "| >",
1030
- "en do",
1031
- ")< |",
1032
- "fte xt",
1033
- "endo ftext",
1034
- "|> (",
1035
- "1 7",
1036
- "a c",
1037
- "o u",
1038
- "s ti",
1039
- "ac ou",
1040
- "sti c",
1041
- "acou stic",
1042
- "a d",
1043
- "{ -",
1044
- "l e",
1045
- "} ']%",
1046
- "3 0",
1047
- "4 2",
1048
- "1 8",
1049
- "s t",
1050
- "3 2",
1051
- "b ra",
1052
- "bra ss",
1053
- "ad d",
1054
- "en se",
1055
- "mb le",
1056
- "rin g",
1057
- "st ring",
1058
- "ense mble",
1059
- "c tion",
1060
- "se ction",
1061
- ") ']%",
1062
- "d is",
1063
- "t or",
1064
- "dis tor",
1065
- "distor tion",
1066
- "1 9",
1067
- "h h",
1068
- "2 0",
1069
- "2 2",
1070
- "( +",
1071
- "(+ )']%",
1072
- "] {-",
1073
- "2 3",
1074
- "s n",
1075
- "2 5",
1076
- "i c",
1077
- "a to",
1078
- "z z",
1079
- "pi zz",
1080
- "ic ato",
1081
- "pizz icato",
1082
- "b d",
1083
- "c t",
1084
- "e ct",
1085
- "ri c",
1086
- "el ect",
1087
- "elect ric",
1088
- "2 7",
1089
- "2 6",
1090
- "i r",
1091
- "o ir",
1092
- "ch oir",
1093
- "h s",
1094
- "a a",
1095
- "aa hs",
1096
- "e r",
1097
- "t d",
1098
- "2 8",
1099
- "2 9",
1100
- "m m",
1101
- ") ))+(",
1102
- "3 1",
1103
- "o c",
1104
- "f in",
1105
- "g er",
1106
- "fin ger",
1107
- "g an",
1108
- "or gan",
1109
- "3 3",
1110
- "oc k",
1111
- "[' (+)']%",
1112
- "j o",
1113
- "n jo",
1114
- "ba njo",
1115
- "p ad",
1116
- "3 4",
1117
- "] ']%",
1118
- "r ock",
1119
- "3 7",
1120
- "3 9",
1121
- "4 1",
1122
- "4 4",
1123
- "r s",
1124
- "8 4",
1125
- "6 9",
1126
- ")( )<|",
1127
- "3 6",
1128
- "w ar",
1129
- "war m",
1130
- "et le",
1131
- "fr etle",
1132
- "fretle ss",
1133
- "5 3",
1134
- "[' [",
1135
- "m ba",
1136
- "4 5",
1137
- "a ri",
1138
- "m ari",
1139
- "mari mba",
1140
- "4 7",
1141
- "g pi",
1142
- "p e",
1143
- "ba gpi",
1144
- "bagpi pe",
1145
- ") )<|",
1146
- "4 8",
1147
- "3 8",
1148
- "] [",
1149
- "e st",
1150
- "cel est",
1151
- "celest a",
1152
- "f i",
1153
- "t h",
1154
- "c p",
1155
- "16 8",
1156
- "5 2",
1157
- "f x",
1158
- "e an",
1159
- "cl ean",
1160
- "4 9",
1161
- "arin a",
1162
- "oc arina",
1163
- "4 6",
1164
- "o h",
1165
- "6 0",
1166
- "c i",
1167
- "s ci",
1168
- "5 1",
1169
- "a cc",
1170
- "d i",
1171
- "or di",
1172
- "acc ordi",
1173
- "accordi on",
1174
- "5 0",
1175
- "5 4",
1176
- "n th",
1177
- "s y",
1178
- "sy nth",
1179
- "5 5",
1180
- "5 9",
1181
- "le ad",
1182
- "v er",
1183
- "on k",
1184
- "r ch",
1185
- "u rch",
1186
- "ch urch",
1187
- "12 0",
1188
- "d ri",
1189
- "o ver",
1190
- "v en",
1191
- "dri ven",
1192
- "over driven",
1193
- "7 0",
1194
- "} {-",
1195
- "7 3",
1196
- "b t",
1197
- "6 1",
1198
- "n e",
1199
- "8 7",
1200
- "8 0",
1201
- "a p",
1202
- "l ap",
1203
- "s lap",
1204
- "a g",
1205
- "d d",
1206
- "o ic",
1207
- "v oic",
1208
- "fi dd",
1209
- "ne w",
1210
- "ag e",
1211
- "voic e",
1212
- "fidd le",
1213
- "8 3",
1214
- "h onk",
1215
- "s pi",
1216
- "t onk",
1217
- "en spi",
1218
- "gl ock",
1219
- "honk y",
1220
- "enspi el",
1221
- "glock enspiel",
1222
- "6 7",
1223
- "o th",
1224
- "w to",
1225
- "sa wto",
1226
- "sawto oth",
1227
- "8 1",
1228
- "7 7",
1229
- "m t",
1230
- "5 7",
1231
- "10 1",
1232
- "10 9",
1233
- "7 9",
1234
- "11 2",
1235
- "8 9",
1236
- "6 2",
1237
- "11 3",
1238
- "1 40",
1239
- "l t",
1240
- "7 1",
1241
- "10 3",
1242
- "9 7",
1243
- "b lo",
1244
- "t t",
1245
- "w n",
1246
- "bo tt",
1247
- "blo wn",
1248
- "bott le",
1249
- "9 5",
1250
- "11 5",
1251
- "15 1",
1252
- "8 5",
1253
- "28 0",
1254
- "13 7",
1255
- "1 43",
1256
- "24 0",
1257
- "9 1",
1258
- "12 5",
1259
- "24 1",
1260
- "1 21",
1261
- "9 2",
1262
- "11 6",
1263
- "12 3",
1264
- "18 7",
1265
- "a t",
1266
- "h er",
1267
- "m o",
1268
- "p her",
1269
- "s pher",
1270
- "12 7",
1271
- "13 1",
1272
- "22 9",
1273
- "at mo",
1274
- "spher e",
1275
- "atmo sphere",
1276
- "6 3",
1277
- "8 2",
1278
- "11 9",
1279
- "17 3",
1280
- "22 3",
1281
- "17 9",
1282
- "9 3",
1283
- "12 9",
1284
- "8 40",
1285
- "10 5",
1286
- "29 3",
1287
- "a ra",
1288
- "n g",
1289
- "bright ne",
1290
- "ch ara",
1291
- "brightne ss",
1292
- "chara ng",
1293
- "11 7",
1294
- "13 9",
1295
- "16 9",
1296
- ") ))<|",
1297
- "16 7",
1298
- "18 5",
1299
- "13 3",
1300
- "15 7",
1301
- "18 1",
1302
- "3 65",
1303
- "m u",
1304
- "t ed",
1305
- "mu ted",
1306
- "2 10",
1307
- "2 21",
1308
- "7 6",
1309
- "o o",
1310
- "19 9",
1311
- "oo hs",
1312
- "c y",
1313
- "e ver",
1314
- "r ever",
1315
- "20 7",
1316
- "28 9",
1317
- "33 6",
1318
- "mba l",
1319
- "109 4",
1320
- "cy mbal",
1321
- "rever se",
1322
- "19 7",
1323
- "10 7",
1324
- "14 7",
1325
- "9 9",
1326
- "7 5",
1327
- "15 3",
1328
- "25 7",
1329
- "28 1",
1330
- "38 9",
1331
- "2 11",
1332
- "5 29",
1333
- "5 53",
1334
- "6 8",
1335
- "10 87",
1336
- "21 3",
1337
- "19 1",
1338
- "20 9",
1339
- "27 1",
1340
- "29 5",
1341
- "46 7",
1342
- "3 43",
1343
- "7 19",
1344
- "7 37",
1345
- "8 43",
1346
- "9 17",
1347
- "24 7",
1348
- "43 7",
1349
- "40 9",
1350
- "12 8",
1351
- "35 9",
1352
- "14 5",
1353
- "20 5",
1354
- "29 7",
1355
- "37 1",
1356
- "39 1",
1357
- "69 7",
1358
- "45 1",
1359
- "67 1",
1360
- "67 9",
1361
- "3 19",
1362
- "6 23",
1363
- "6 69",
1364
- "7 33",
1365
- "7 67",
1366
- "7 57",
1367
- "8 11",
1368
- "8 83",
1369
- "9 13",
1370
- "9 35",
1371
- "24 3",
1372
- "21 2",
1373
- "21 7",
1374
- "56 0",
1375
- "56 9",
1376
- "15 2",
1377
- "15 5",
1378
- "15 21",
1379
- "16 1",
1380
- "16 3",
1381
- "16 27",
1382
- "17 7",
1383
- "18 6",
1384
- "32 3",
1385
- "32 7",
1386
- "25 5",
1387
- "26 3",
1388
- "26 8",
1389
- "33 4",
1390
- "34 5",
1391
- "39 2",
1392
- "39 9",
1393
- "69 5",
1394
- "69 9",
1395
- "47 5",
1396
- "48 9",
1397
- "49 1",
1398
- "59 1",
1399
- "70 5",
1400
- "80 1",
1401
- "365 3",
1402
- "99 43",
1403
- "14 9",
1404
- "9 22",
1405
- "15 9",
1406
- "b l",
1407
- "o bl",
1408
- "in s",
1409
- "gl obl",
1410
- "19 3",
1411
- "37 7",
1412
- "globl ins",
1413
- "5 8",
1414
- "22 7",
1415
- "46 3",
1416
- "2 35",
1417
- "3 11",
1418
- "11 1",
1419
- "14 1",
1420
- "14 8",
1421
- "16 91",
1422
- "17 0",
1423
- "42 2",
1424
- "18 8",
1425
- "20 1",
1426
- "26 9",
1427
- "48 1"
1428
- ]
1429
  }
1430
  }
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
7
+ "id": 260,
8
  "content": "<|endoftext|>",
9
  "single_word": false,
10
  "lstrip": false,
 
300
  "ŀ": 256,
301
  "Ł": 257,
302
  "ł": 258,
303
+ "Ń": 259
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
304
  },
305
+ "merges": []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
306
  }
307
  }
vocab.json CHANGED
@@ -1 +1 @@
1
- {"<s>":0,"</s>":1,"<unk>":2,"<mask>":3,"!":4,"\"":5,"#":6,"$":7,"%":8,"&":9,"'":10,"(":11,")":12,"*":13,"+":14,",":15,"-":16,".":17,"/":18,"0":19,"1":20,"2":21,"3":22,"4":23,"5":24,"6":25,"7":26,"8":27,"9":28,":":29,";":30,"<":31,"=":32,">":33,"?":34,"@":35,"A":36,"B":37,"C":38,"D":39,"E":40,"F":41,"G":42,"H":43,"I":44,"J":45,"K":46,"L":47,"M":48,"N":49,"O":50,"P":51,"Q":52,"R":53,"S":54,"T":55,"U":56,"V":57,"W":58,"X":59,"Y":60,"Z":61,"[":62,"\\":63,"]":64,"^":65,"_":66,"`":67,"a":68,"b":69,"c":70,"d":71,"e":72,"f":73,"g":74,"h":75,"i":76,"j":77,"k":78,"l":79,"m":80,"n":81,"o":82,"p":83,"q":84,"r":85,"s":86,"t":87,"u":88,"v":89,"w":90,"x":91,"y":92,"z":93,"{":94,"|":95,"}":96,"~":97,"¡":98,"¢":99,"£":100,"¤":101,"¥":102,"¦":103,"§":104,"¨":105,"©":106,"ª":107,"«":108,"¬":109,"®":110,"¯":111,"°":112,"±":113,"²":114,"³":115,"´":116,"µ":117,"¶":118,"·":119,"¸":120,"¹":121,"º":122,"»":123,"¼":124,"½":125,"¾":126,"¿":127,"À":128,"Á":129,"Â":130,"Ã":131,"Ä":132,"Å":133,"Æ":134,"Ç":135,"È":136,"É":137,"Ê":138,"Ë":139,"Ì":140,"Í":141,"Î":142,"Ï":143,"Ð":144,"Ñ":145,"Ò":146,"Ó":147,"Ô":148,"Õ":149,"Ö":150,"×":151,"Ø":152,"Ù":153,"Ú":154,"Û":155,"Ü":156,"Ý":157,"Þ":158,"ß":159,"à":160,"á":161,"â":162,"ã":163,"ä":164,"å":165,"æ":166,"ç":167,"è":168,"é":169,"ê":170,"ë":171,"ì":172,"í":173,"î":174,"ï":175,"ð":176,"ñ":177,"ò":178,"ó":179,"ô":180,"õ":181,"ö":182,"÷":183,"ø":184,"ù":185,"ú":186,"û":187,"ü":188,"ý":189,"þ":190,"ÿ":191,"Ā":192,"ā":193,"Ă":194,"ă":195,"Ą":196,"ą":197,"Ć":198,"ć":199,"Ĉ":200,"ĉ":201,"Ċ":202,"ċ":203,"Č":204,"č":205,"Ď":206,"ď":207,"Đ":208,"đ":209,"Ē":210,"ē":211,"Ĕ":212,"ĕ":213,"Ė":214,"ė":215,"Ę":216,"ę":217,"Ě":218,"ě":219,"Ĝ":220,"ĝ":221,"Ğ":222,"ğ":223,"Ġ":224,"ġ":225,"Ģ":226,"ģ":227,"Ĥ":228,"ĥ":229,"Ħ":230,"ħ":231,"Ĩ":232,"ĩ":233,"Ī":234,"ī":235,"Ĭ":236,"ĭ":237,"Į":238,"į":239,"İ":240,"ı":241,"IJ":242,"ij":243,"Ĵ":244,"ĵ":245,"Ķ":246,"ķ":247,"ĸ":248,"Ĺ":249,"ĺ":250,"Ļ":251,"ļ":252,"Ľ":253,"ľ":254,"Ŀ":255,"ŀ":256,"Ł":257,"ł":258,"Ń":259,").":260,"(-":261,"__":262,"mp":263,"no":264,"pi":265,"ano":266,"piano":267,")+":268,"pp":269,")(":270,")+(":271,"II":272,"ed":273,"']":274,"['":275,"']%":276,"qd":277,"sd":278,"ff":279,"en":280,"ra":281,"au":282,"fra":283,"gm":284,"ent":285,"augm":286,"frac":287,"augment":288,"ri":289,"VII":290,"ht":291,"bri":292,"ght":293,"bright":294,"IV":295,"),":296,"11":297,"hd":298,"10":299,"VI":300,"III":301,")).":302,"))+":303,"fff":304,"24":305,")()+(":306,"su":307,"on":308,"64":309,"ba":310,"sa":311,"sax":312,"21":313,"))+(":314,"65":315,"te":316,"ppp":317,"wd":318,"tr":319,"43":320,"ol":321,"ss":322,"et":323,"ar":324,"or":325,"one":326,"bass":327,"ti":328,"hor":329,"horn":330,"el":331,"iol":332,"viol":333,"mb":334,"56":335,"ump":336,"trump":337,"trumpet":338,"gu":339,"it":340,"guit":341,"guitar":342,"to":343,"omb":344,"tromb":345,"trombone":346,"40":347,"is":348,"rin":349,"12":350,"ch":351,"nor":352,"tenor":353,"13":354,"al":355,"alto":356,"in":357,"15":358,"op":359,"rano":360,"sop":361,"soprano":362,"an":363,"gl":364,"har":365,"harp":366,"cel":367,"engl":368,"ish":369,"english":370,"fr":371,"tu":372,"tuba":373,"bo":374,"tone":375,"ritone":376,"baritone":377,"lo":378,"obo":379,"oboe":380,"cc":381,"cello":382,"cl":383,"arin":384,"violin":385,"ench":386,"french":387,"picc":388,"olo":389,"piccolo":390,"oon":391,"bassoon":392,"clarin":393,"clarinet":394,"dr":395,"ms":396,"ums":397,"drums":398,"viola":399,"fl":400,"ute":401,"flute":402,"con":403,"tra":404,"contra":405,"contrabass":406,"mpan":407,"timpan":408,"timpani":409,"35":410,")),":411,"se":412,"14":413,"tion":414,"ste":415,"steel":416,"16":417,")<":418,"do":419,"fte":420,"xt":421,"|>":422,"endo":423,")<|":424,"ftext":425,"endoftext":426,"|>(":427,"17":428,"ac":429,"ou":430,"sti":431,"acou":432,"stic":433,"acoustic":434,"ad":435,"{-":436,"le":437,"}']%":438,"30":439,"42":440,"18":441,"st":442,"32":443,"bra":444,"brass":445,"add":446,"ense":447,"mble":448,"ring":449,"string":450,"ensemble":451,"ction":452,"section":453,")']%":454,"dis":455,"tor":456,"distor":457,"distortion":458,"19":459,"hh":460,"20":461,"22":462,"(+":463,"(+)']%":464,"]{-":465,"23":466,"sn":467,"25":468,"ic":469,"ato":470,"zz":471,"pizz":472,"icato":473,"pizzicato":474,"bd":475,"ct":476,"ect":477,"ric":478,"elect":479,"electric":480,"27":481,"26":482,"ir":483,"oir":484,"choir":485,"hs":486,"aa":487,"aahs":488,"er":489,"td":490,"28":491,"29":492,"mm":493,")))+(":494,"31":495,"oc":496,"fin":497,"ger":498,"finger":499,"gan":500,"organ":501,"33":502,"ock":503,"['(+)']%":504,"jo":505,"njo":506,"banjo":507,"pad":508,"34":509,"]']%":510,"rock":511,"37":512,"39":513,"41":514,"44":515,"rs":516,"84":517,"69":518,")()<|":519,"36":520,"war":521,"warm":522,"etle":523,"fretle":524,"fretless":525,"53":526,"['[":527,"mba":528,"45":529,"ari":530,"mari":531,"marimba":532,"47":533,"gpi":534,"pe":535,"bagpi":536,"bagpipe":537,"))<|":538,"48":539,"38":540,"][":541,"est":542,"celest":543,"celesta":544,"fi":545,"th":546,"cp":547,"168":548,"52":549,"fx":550,"ean":551,"clean":552,"49":553,"arina":554,"ocarina":555,"46":556,"oh":557,"60":558,"ci":559,"sci":560,"51":561,"acc":562,"di":563,"ordi":564,"accordi":565,"accordion":566,"50":567,"54":568,"nth":569,"sy":570,"synth":571,"55":572,"59":573,"lead":574,"ver":575,"onk":576,"rch":577,"urch":578,"church":579,"120":580,"dri":581,"over":582,"ven":583,"driven":584,"overdriven":585,"70":586,"}{-":587,"73":588,"bt":589,"61":590,"ne":591,"87":592,"80":593,"ap":594,"lap":595,"slap":596,"ag":597,"dd":598,"oic":599,"voic":600,"fidd":601,"new":602,"age":603,"voice":604,"fiddle":605,"83":606,"honk":607,"spi":608,"tonk":609,"enspi":610,"glock":611,"honky":612,"enspiel":613,"glockenspiel":614,"67":615,"oth":616,"wto":617,"sawto":618,"sawtooth":619,"81":620,"77":621,"mt":622,"57":623,"101":624,"109":625,"79":626,"112":627,"89":628,"62":629,"113":630,"140":631,"lt":632,"71":633,"103":634,"97":635,"blo":636,"tt":637,"wn":638,"bott":639,"blown":640,"bottle":641,"95":642,"115":643,"151":644,"85":645,"280":646,"137":647,"143":648,"240":649,"91":650,"125":651,"241":652,"121":653,"92":654,"116":655,"123":656,"187":657,"at":658,"her":659,"mo":660,"pher":661,"spher":662,"127":663,"131":664,"229":665,"atmo":666,"sphere":667,"atmosphere":668,"63":669,"82":670,"119":671,"173":672,"223":673,"179":674,"93":675,"129":676,"840":677,"105":678,"293":679,"ara":680,"ng":681,"brightne":682,"chara":683,"brightness":684,"charang":685,"117":686,"139":687,"169":688,")))<|":689,"167":690,"185":691,"133":692,"157":693,"181":694,"365":695,"mu":696,"ted":697,"muted":698,"210":699,"221":700,"76":701,"oo":702,"199":703,"oohs":704,"cy":705,"ever":706,"rever":707,"207":708,"289":709,"336":710,"mbal":711,"1094":712,"cymbal":713,"reverse":714,"197":715,"107":716,"147":717,"99":718,"75":719,"153":720,"257":721,"281":722,"389":723,"211":724,"529":725,"553":726,"68":727,"1087":728,"213":729,"191":730,"209":731,"271":732,"295":733,"467":734,"343":735,"719":736,"737":737,"843":738,"917":739,"247":740,"437":741,"409":742,"128":743,"359":744,"145":745,"205":746,"297":747,"371":748,"391":749,"697":750,"451":751,"671":752,"679":753,"319":754,"623":755,"669":756,"733":757,"767":758,"757":759,"811":760,"883":761,"913":762,"935":763,"243":764,"212":765,"217":766,"560":767,"569":768,"152":769,"155":770,"1521":771,"161":772,"163":773,"1627":774,"177":775,"186":776,"323":777,"327":778,"255":779,"263":780,"268":781,"334":782,"345":783,"392":784,"399":785,"695":786,"699":787,"475":788,"489":789,"491":790,"591":791,"705":792,"801":793,"3653":794,"9943":795,"149":796,"922":797,"159":798,"bl":799,"obl":800,"ins":801,"globl":802,"193":803,"377":804,"globlins":805,"58":806,"227":807,"463":808,"235":809,"311":810,"111":811,"141":812,"148":813,"1691":814,"170":815,"422":816,"188":817,"201":818,"269":819,"481":820}
 
1
+ {"<s>":0,"</s>":1,"<unk>":2,"<mask>":3,"!":4,"\"":5,"#":6,"$":7,"%":8,"&":9,"'":10,"(":11,")":12,"*":13,"+":14,",":15,"-":16,".":17,"/":18,"0":19,"1":20,"2":21,"3":22,"4":23,"5":24,"6":25,"7":26,"8":27,"9":28,":":29,";":30,"<":31,"=":32,">":33,"?":34,"@":35,"A":36,"B":37,"C":38,"D":39,"E":40,"F":41,"G":42,"H":43,"I":44,"J":45,"K":46,"L":47,"M":48,"N":49,"O":50,"P":51,"Q":52,"R":53,"S":54,"T":55,"U":56,"V":57,"W":58,"X":59,"Y":60,"Z":61,"[":62,"\\":63,"]":64,"^":65,"_":66,"`":67,"a":68,"b":69,"c":70,"d":71,"e":72,"f":73,"g":74,"h":75,"i":76,"j":77,"k":78,"l":79,"m":80,"n":81,"o":82,"p":83,"q":84,"r":85,"s":86,"t":87,"u":88,"v":89,"w":90,"x":91,"y":92,"z":93,"{":94,"|":95,"}":96,"~":97,"¡":98,"¢":99,"£":100,"¤":101,"¥":102,"¦":103,"§":104,"¨":105,"©":106,"ª":107,"«":108,"¬":109,"®":110,"¯":111,"°":112,"±":113,"²":114,"³":115,"´":116,"µ":117,"¶":118,"·":119,"¸":120,"¹":121,"º":122,"»":123,"¼":124,"½":125,"¾":126,"¿":127,"À":128,"Á":129,"Â":130,"Ã":131,"Ä":132,"Å":133,"Æ":134,"Ç":135,"È":136,"É":137,"Ê":138,"Ë":139,"Ì":140,"Í":141,"Î":142,"Ï":143,"Ð":144,"Ñ":145,"Ò":146,"Ó":147,"Ô":148,"Õ":149,"Ö":150,"×":151,"Ø":152,"Ù":153,"Ú":154,"Û":155,"Ü":156,"Ý":157,"Þ":158,"ß":159,"à":160,"á":161,"â":162,"ã":163,"ä":164,"å":165,"æ":166,"ç":167,"è":168,"é":169,"ê":170,"ë":171,"ì":172,"í":173,"î":174,"ï":175,"ð":176,"ñ":177,"ò":178,"ó":179,"ô":180,"õ":181,"ö":182,"÷":183,"ø":184,"ù":185,"ú":186,"û":187,"ü":188,"ý":189,"þ":190,"ÿ":191,"Ā":192,"ā":193,"Ă":194,"ă":195,"Ą":196,"ą":197,"Ć":198,"ć":199,"Ĉ":200,"ĉ":201,"Ċ":202,"ċ":203,"Č":204,"č":205,"Ď":206,"ď":207,"Đ":208,"đ":209,"Ē":210,"ē":211,"Ĕ":212,"ĕ":213,"Ė":214,"ė":215,"Ę":216,"ę":217,"Ě":218,"ě":219,"Ĝ":220,"ĝ":221,"Ğ":222,"ğ":223,"Ġ":224,"ġ":225,"Ģ":226,"ģ":227,"Ĥ":228,"ĥ":229,"Ħ":230,"ħ":231,"Ĩ":232,"ĩ":233,"Ī":234,"ī":235,"Ĭ":236,"ĭ":237,"Į":238,"į":239,"İ":240,"ı":241,"IJ":242,"ij":243,"Ĵ":244,"ĵ":245,"Ķ":246,"ķ":247,"ĸ":248,"Ĺ":249,"ĺ":250,"Ļ":251,"ļ":252,"Ľ":253,"ľ":254,"Ŀ":255,"ŀ":256,"Ł":257,"ł":258,"Ń":259}