| { |
| "version": "1.0", |
| "truncation": null, |
| "padding": null, |
| "added_tokens": [ |
| { |
| "id": 0, |
| "special": true, |
| "content": "[STOP]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false |
| }, |
| { |
| "id": 1, |
| "special": true, |
| "content": "[UNK]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false |
| }, |
| { |
| "id": 2, |
| "special": true, |
| "content": "[SPACE]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false |
| }, |
| { |
| "id": 255, |
| "special": true, |
| "content": "[START]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false |
| }, |
| { |
| "id": 604, |
| "content": "[UH]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 605, |
| "content": "[UM]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 606, |
| "content": "[giggle]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 607, |
| "content": "[laughter]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 608, |
| "content": "[guffaw]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 609, |
| "content": "[inhale]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 610, |
| "content": "[exhale]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 611, |
| "content": "[sigh]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 612, |
| "content": "[cry]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 613, |
| "content": "[bark]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 614, |
| "content": "[howl]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 615, |
| "content": "[meow]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 616, |
| "content": "[singing]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 617, |
| "content": "[music]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 618, |
| "content": "[whistle]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 619, |
| "content": "[humming]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 620, |
| "content": "[gasp]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 621, |
| "content": "[groan]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 622, |
| "content": "[whisper]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 623, |
| "content": "[mumble]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 624, |
| "content": "[sniff]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 625, |
| "content": "[sneeze]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 626, |
| "content": "[cough]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 627, |
| "content": "[snore]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 628, |
| "content": "[chew]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 629, |
| "content": "[sip]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 630, |
| "content": "[clear_throat]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 631, |
| "content": "[kiss]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 632, |
| "content": "[shhh]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 633, |
| "content": "[gibberish]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 634, |
| "content": "[fr]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 635, |
| "content": "[es]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 636, |
| "content": "[de]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 637, |
| "content": "[it]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 638, |
| "content": "[ipa]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 639, |
| "content": "[end_of_label]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 695, |
| "content": "[PLACEHOLDER55]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 696, |
| "content": "[PLACEHOLDER56]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 697, |
| "content": "[PLACEHOLDER57]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 698, |
| "content": "[PLACEHOLDER58]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 699, |
| "content": "[PLACEHOLDER59]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 700, |
| "content": "[PLACEHOLDER60]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 701, |
| "content": "[PLACEHOLDER61]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 702, |
| "content": "[PLACEHOLDER62]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 703, |
| "content": "[PLACEHOLDER63]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| } |
| ], |
| "normalizer": null, |
| "pre_tokenizer": { |
| "type": "Whitespace" |
| }, |
| "post_processor": null, |
| "decoder": null, |
| "model": { |
| "type": "BPE", |
| "dropout": null, |
| "unk_token": "[UNK]", |
| "continuing_subword_prefix": null, |
| "end_of_word_suffix": null, |
| "fuse_unk": false, |
| "vocab": { |
| "[STOP]": 0, |
| "[UNK]": 1, |
| "[SPACE]": 2, |
| "!": 3, |
| "'": 4, |
| "(": 5, |
| ")": 6, |
| ",": 7, |
| "-": 8, |
| ".": 9, |
| "/": 10, |
| ":": 11, |
| ";": 12, |
| "?": 13, |
| "a": 14, |
| "b": 15, |
| "c": 16, |
| "d": 17, |
| "e": 18, |
| "f": 19, |
| "g": 20, |
| "h": 21, |
| "i": 22, |
| "j": 23, |
| "k": 24, |
| "l": 25, |
| "m": 26, |
| "n": 27, |
| "o": 28, |
| "p": 29, |
| "q": 30, |
| "r": 31, |
| "s": 32, |
| "t": 33, |
| "u": 34, |
| "v": 35, |
| "w": 36, |
| "x": 37, |
| "y": 38, |
| "z": 39, |
| "th": 40, |
| "in": 41, |
| "the": 42, |
| "an": 43, |
| "er": 44, |
| "ou": 45, |
| "re": 46, |
| "on": 47, |
| "at": 48, |
| "ed": 49, |
| "en": 50, |
| "to": 51, |
| "ing": 52, |
| "and": 53, |
| "is": 54, |
| "as": 55, |
| "al": 56, |
| "or": 57, |
| "of": 58, |
| "ar": 59, |
| "it": 60, |
| "es": 61, |
| "he": 62, |
| "st": 63, |
| "le": 64, |
| "om": 65, |
| "se": 66, |
| "be": 67, |
| "ad": 68, |
| "ow": 69, |
| "ly": 70, |
| "ch": 71, |
| "wh": 72, |
| "that": 73, |
| "you": 74, |
| "li": 75, |
| "ve": 76, |
| "ac": 77, |
| "ti": 78, |
| "ld": 79, |
| "me": 80, |
| "was": 81, |
| "gh": 82, |
| "id": 83, |
| "ll": 84, |
| "wi": 85, |
| "ent": 86, |
| "for": 87, |
| "ay": 88, |
| "ro": 89, |
| "ver": 90, |
| "ic": 91, |
| "her": 92, |
| "ke": 93, |
| "his": 94, |
| "no": 95, |
| "ut": 96, |
| "un": 97, |
| "ir": 98, |
| "lo": 99, |
| "we": 100, |
| "ri": 101, |
| "ha": 102, |
| "with": 103, |
| "ght": 104, |
| "out": 105, |
| "im": 106, |
| "ion": 107, |
| "all": 108, |
| "ab": 109, |
| "one": 110, |
| "ne": 111, |
| "ge": 112, |
| "ould": 113, |
| "ter": 114, |
| "mo": 115, |
| "had": 116, |
| "ce": 117, |
| "she": 118, |
| "go": 119, |
| "sh": 120, |
| "ur": 121, |
| "am": 122, |
| "so": 123, |
| "pe": 124, |
| "my": 125, |
| "de": 126, |
| "are": 127, |
| "but": 128, |
| "ome": 129, |
| "fr": 130, |
| "ther": 131, |
| "fe": 132, |
| "su": 133, |
| "do": 134, |
| "con": 135, |
| "te": 136, |
| "ain": 137, |
| "ere": 138, |
| "po": 139, |
| "if": 140, |
| "they": 141, |
| "us": 142, |
| "ag": 143, |
| "tr": 144, |
| "now": 145, |
| "oun": 146, |
| "this": 147, |
| "have": 148, |
| "not": 149, |
| "sa": 150, |
| "il": 151, |
| "up": 152, |
| "thing": 153, |
| "from": 154, |
| "ap": 155, |
| "him": 156, |
| "ack": 157, |
| "ation": 158, |
| "ant": 159, |
| "our": 160, |
| "op": 161, |
| "like": 162, |
| "ust": 163, |
| "ess": 164, |
| "bo": 165, |
| "ok": 166, |
| "ul": 167, |
| "ind": 168, |
| "ex": 169, |
| "com": 170, |
| "some": 171, |
| "there": 172, |
| "ers": 173, |
| "co": 174, |
| "res": 175, |
| "man": 176, |
| "ard": 177, |
| "pl": 178, |
| "wor": 179, |
| "way": 180, |
| "tion": 181, |
| "fo": 182, |
| "ca": 183, |
| "were": 184, |
| "by": 185, |
| "ate": 186, |
| "pro": 187, |
| "ted": 188, |
| "ound": 189, |
| "own": 190, |
| "would": 191, |
| "ts": 192, |
| "what": 193, |
| "qu": 194, |
| "ally": 195, |
| "ight": 196, |
| "ck": 197, |
| "gr": 198, |
| "when": 199, |
| "ven": 200, |
| "can": 201, |
| "ough": 202, |
| "ine": 203, |
| "end": 204, |
| "per": 205, |
| "ous": 206, |
| "od": 207, |
| "ide": 208, |
| "know": 209, |
| "ty": 210, |
| "very": 211, |
| "si": 212, |
| "ak": 213, |
| "who": 214, |
| "about": 215, |
| "ill": 216, |
| "them": 217, |
| "est": 218, |
| "red": 219, |
| "ye": 220, |
| "could": 221, |
| "ong": 222, |
| "your": 223, |
| "their": 224, |
| "em": 225, |
| "just": 226, |
| "other": 227, |
| "into": 228, |
| "any": 229, |
| "whi": 230, |
| "um": 231, |
| "tw": 232, |
| "ast": 233, |
| "der": 234, |
| "did": 235, |
| "ie": 236, |
| "been": 237, |
| "ace": 238, |
| "ink": 239, |
| "ity": 240, |
| "back": 241, |
| "ting": 242, |
| "br": 243, |
| "more": 244, |
| "ake": 245, |
| "pp": 246, |
| "then": 247, |
| "sp": 248, |
| "el": 249, |
| "use": 250, |
| "bl": 251, |
| "said": 252, |
| "over": 253, |
| "get": 254, |
| "[START]": 255, |
| "\"": 256, |
| "#": 257, |
| "$": 258, |
| "%": 259, |
| "&": 260, |
| "*": 261, |
| "+": 262, |
| "0": 263, |
| "1": 264, |
| "2": 265, |
| "3": 266, |
| "4": 267, |
| "5": 268, |
| "6": 269, |
| "7": 270, |
| "8": 271, |
| "9": 272, |
| "<": 273, |
| "=": 274, |
| ">": 275, |
| "@": 276, |
| "A": 277, |
| "B": 278, |
| "C": 279, |
| "D": 280, |
| "E": 281, |
| "F": 282, |
| "G": 283, |
| "H": 284, |
| "I": 285, |
| "J": 286, |
| "K": 287, |
| "L": 288, |
| "M": 289, |
| "N": 290, |
| "O": 291, |
| "P": 292, |
| "Q": 293, |
| "R": 294, |
| "S": 295, |
| "T": 296, |
| "U": 297, |
| "V": 298, |
| "W": 299, |
| "X": 300, |
| "Y": 301, |
| "Z": 302, |
| "[": 303, |
| "\\": 304, |
| "]": 305, |
| "^": 306, |
| "_": 307, |
| "`": 308, |
| "{": 309, |
| "|": 310, |
| "}": 311, |
| "~": 312, |
| "‐": 313, |
| "‑": 314, |
| "‒": 315, |
| "–": 316, |
| "—": 317, |
| "―": 318, |
| "‖": 319, |
| "‗": 320, |
| "‘": 321, |
| "’": 322, |
| "‚": 323, |
| "‛": 324, |
| "“": 325, |
| "”": 326, |
| "„": 327, |
| "‟": 328, |
| "\u00a0": 329, |
| "¡": 330, |
| "¢": 331, |
| "£": 332, |
| "¤": 333, |
| "¥": 334, |
| "¦": 335, |
| "§": 336, |
| "¨": 337, |
| "©": 338, |
| "ª": 339, |
| "«": 340, |
| "¬": 341, |
| "\u00ad": 342, |
| "®": 343, |
| "¯": 344, |
| "°": 345, |
| "±": 346, |
| "²": 347, |
| "³": 348, |
| "´": 349, |
| "µ": 350, |
| "¶": 351, |
| "·": 352, |
| "¸": 353, |
| "¹": 354, |
| "º": 355, |
| "»": 356, |
| "¼": 357, |
| "½": 358, |
| "¾": 359, |
| "¿": 360, |
| "À": 361, |
| "Á": 362, |
| "Â": 363, |
| "Ã": 364, |
| "Ä": 365, |
| "Å": 366, |
| "Æ": 367, |
| "Ç": 368, |
| "È": 369, |
| "É": 370, |
| "Ê": 371, |
| "Ë": 372, |
| "Ì": 373, |
| "Í": 374, |
| "Î": 375, |
| "Ï": 376, |
| "Ð": 377, |
| "Ñ": 378, |
| "Ò": 379, |
| "Ó": 380, |
| "Ô": 381, |
| "Õ": 382, |
| "Ö": 383, |
| "×": 384, |
| "Ø": 385, |
| "Ù": 386, |
| "Ú": 387, |
| "Û": 388, |
| "Ü": 389, |
| "Ý": 390, |
| "Þ": 391, |
| "ß": 392, |
| "à": 393, |
| "á": 394, |
| "â": 395, |
| "ã": 396, |
| "ä": 397, |
| "å": 398, |
| "æ": 399, |
| "ç": 400, |
| "è": 401, |
| "é": 402, |
| "ê": 403, |
| "ë": 404, |
| "ì": 405, |
| "í": 406, |
| "î": 407, |
| "ï": 408, |
| "ð": 409, |
| "ñ": 410, |
| "ò": 411, |
| "ó": 412, |
| "ô": 413, |
| "õ": 414, |
| "ö": 415, |
| "÷": 416, |
| "ø": 417, |
| "ù": 418, |
| "ú": 419, |
| "û": 420, |
| "ü": 421, |
| "ý": 422, |
| "þ": 423, |
| "ÿ": 424, |
| "ɐ": 425, |
| "ɑ": 426, |
| "ɒ": 427, |
| "ɓ": 428, |
| "ɔ": 429, |
| "ɕ": 430, |
| "ɖ": 431, |
| "ɗ": 432, |
| "ɘ": 433, |
| "ə": 434, |
| "ɚ": 435, |
| "ɛ": 436, |
| "ɜ": 437, |
| "ɝ": 438, |
| "ɞ": 439, |
| "ɟ": 440, |
| "ɠ": 441, |
| "ɡ": 442, |
| "ɢ": 443, |
| "ɣ": 444, |
| "ɤ": 445, |
| "ɥ": 446, |
| "ɦ": 447, |
| "ɧ": 448, |
| "ɨ": 449, |
| "ɩ": 450, |
| "ɪ": 451, |
| "ɫ": 452, |
| "ɬ": 453, |
| "ɭ": 454, |
| "ɮ": 455, |
| "ɯ": 456, |
| "ɰ": 457, |
| "ɱ": 458, |
| "ɲ": 459, |
| "ɳ": 460, |
| "ɴ": 461, |
| "ɵ": 462, |
| "ɶ": 463, |
| "ɷ": 464, |
| "ɸ": 465, |
| "ɹ": 466, |
| "ɺ": 467, |
| "ɻ": 468, |
| "ɼ": 469, |
| "ɽ": 470, |
| "ɾ": 471, |
| "ɿ": 472, |
| "ʀ": 473, |
| "ʁ": 474, |
| "ʂ": 475, |
| "ʃ": 476, |
| "ʄ": 477, |
| "ʅ": 478, |
| "ʆ": 479, |
| "ʇ": 480, |
| "ʈ": 481, |
| "ʉ": 482, |
| "ʊ": 483, |
| "ʋ": 484, |
| "ʌ": 485, |
| "ʍ": 486, |
| "ʎ": 487, |
| "ʏ": 488, |
| "ʐ": 489, |
| "ʑ": 490, |
| "ʒ": 491, |
| "ʓ": 492, |
| "ʔ": 493, |
| "ʕ": 494, |
| "ʖ": 495, |
| "ʗ": 496, |
| "ʘ": 497, |
| "ʙ": 498, |
| "ʚ": 499, |
| "ʛ": 500, |
| "ʜ": 501, |
| "ʝ": 502, |
| "ʞ": 503, |
| "ʟ": 504, |
| "ʠ": 505, |
| "ʡ": 506, |
| "ʢ": 507, |
| "ʣ": 508, |
| "ʤ": 509, |
| "ʥ": 510, |
| "ʦ": 511, |
| "ʧ": 512, |
| "ʨ": 513, |
| "ʩ": 514, |
| "ʪ": 515, |
| "ʫ": 516, |
| "ʬ": 517, |
| "ʭ": 518, |
| "ʮ": 519, |
| "ʯ": 520, |
| "ʰ": 521, |
| "ʱ": 522, |
| "ʲ": 523, |
| "ʳ": 524, |
| "ʴ": 525, |
| "ʵ": 526, |
| "ʶ": 527, |
| "ʷ": 528, |
| "ʸ": 529, |
| "ʹ": 530, |
| "ʺ": 531, |
| "ʻ": 532, |
| "ʼ": 533, |
| "ʽ": 534, |
| "ʾ": 535, |
| "ʿ": 536, |
| "ˀ": 537, |
| "ˁ": 538, |
| "˂": 539, |
| "˃": 540, |
| "˄": 541, |
| "˅": 542, |
| "ˆ": 543, |
| "ˇ": 544, |
| "ˈ": 545, |
| "ˉ": 546, |
| "ˊ": 547, |
| "ˋ": 548, |
| "ˌ": 549, |
| "ˍ": 550, |
| "ˎ": 551, |
| "ˏ": 552, |
| "ː": 553, |
| "ˑ": 554, |
| "˒": 555, |
| "˓": 556, |
| "˔": 557, |
| "˕": 558, |
| "˖": 559, |
| "˗": 560, |
| "˘": 561, |
| "˙": 562, |
| "˚": 563, |
| "˛": 564, |
| "˜": 565, |
| "˝": 566, |
| "˞": 567, |
| "˟": 568, |
| "ˠ": 569, |
| "ˡ": 570, |
| "ˢ": 571, |
| "ˣ": 572, |
| "ˤ": 573, |
| "˥": 574, |
| "˦": 575, |
| "˧": 576, |
| "˨": 577, |
| "˩": 578, |
| "˪": 579, |
| "˫": 580, |
| "ˬ": 581, |
| "˭": 582, |
| "ˮ": 583, |
| "˯": 584, |
| "˰": 585, |
| "˱": 586, |
| "˲": 587, |
| "˳": 588, |
| "˴": 589, |
| "˵": 590, |
| "˶": 591, |
| "˷": 592, |
| "˸": 593, |
| "˹": 594, |
| "˺": 595, |
| "˻": 596, |
| "˼": 597, |
| "˽": 598, |
| "˾": 599, |
| "˿": 600, |
| "ā": 601, |
| "ō": 602, |
| "…": 603, |
| "[UH]": 604, |
| "[UM]": 605, |
| "[giggle]": 606, |
| "[laughter]": 607, |
| "[guffaw]": 608, |
| "[inhale]": 609, |
| "[exhale]": 610, |
| "[sigh]": 611, |
| "[cry]": 612, |
| "[bark]": 613, |
| "[howl]": 614, |
| "[meow]": 615, |
| "[singing]": 616, |
| "[music]": 617, |
| "[whistle]": 618, |
| "[humming]": 619, |
| "[gasp]": 620, |
| "[groan]": 621, |
| "[whisper]": 622, |
| "[mumble]": 623, |
| "[sniff]": 624, |
| "[sneeze]": 625, |
| "[cough]": 626, |
| "[snore]": 627, |
| "[chew]": 628, |
| "[sip]": 629, |
| "[clear_throat]": 630, |
| "[kiss]": 631, |
| "[shhh]": 632, |
| "[gibberish]": 633, |
| "[fr]": 634, |
| "[es]": 635, |
| "[de]": 636, |
| "[it]": 637, |
| "[ipa]": 638, |
| "[end_of_label]": 639, |
| "ŋ": 640, |
| "ᵻ": 641, |
| "θ": 642, |
| "\u0329": 643, |
| "\u0303": 644, |
| "ɑː": 645, |
| "iː": 646, |
| "uː": 647, |
| "ɜː": 648, |
| "ɔː": 649, |
| "oː": 650, |
| "eɪ": 651, |
| "oʊ": 652, |
| "aɪ": 653, |
| "aʊ": 654, |
| "ɔɪ": 655, |
| "dʒ": 656, |
| "tʃ": 657, |
| "ɪŋ": 658, |
| "ᵻd": 659, |
| "ˈiː": 660, |
| "ˌiː": 661, |
| "ˈɪ": 662, |
| "ˌɪ": 663, |
| "ˈeɪ": 664, |
| "ˌeɪ": 665, |
| "ˈɛ": 666, |
| "ˌɛ": 667, |
| "ˈæ": 668, |
| "ˌæ": 669, |
| "ˈɑː": 670, |
| "ˌɑː": 671, |
| "ˈɔː": 672, |
| "ˌɔː": 673, |
| "oːɹ": 674, |
| "ˈoːɹ": 675, |
| "ˌoːɹ": 676, |
| "ˈoʊ": 677, |
| "ˌoʊ": 678, |
| "ˈʊ": 679, |
| "ˌʊ": 680, |
| "ˈuː": 681, |
| "ˌuː": 682, |
| "ˈɜː": 683, |
| "ˌɜː": 684, |
| "ˈʌ": 685, |
| "ˌʌ": 686, |
| "ˈaɪ": 687, |
| "ˌaɪ": 688, |
| "ˈaʊ": 689, |
| "ˌaʊ": 690, |
| "ˈɔɪ": 691, |
| "ˌɔɪ": 692, |
| "ˈɚ": 693, |
| "ˌɐ": 694, |
| "[PLACEHOLDER55]": 695, |
| "[PLACEHOLDER56]": 696, |
| "[PLACEHOLDER57]": 697, |
| "[PLACEHOLDER58]": 698, |
| "[PLACEHOLDER59]": 699, |
| "[PLACEHOLDER60]": 700, |
| "[PLACEHOLDER61]": 701, |
| "[PLACEHOLDER62]": 702, |
| "[PLACEHOLDER63]": 703 |
| }, |
| "merges": [ |
| "t h", |
| "i n", |
| "th e", |
| "a n", |
| "e r", |
| "o u", |
| "r e", |
| "o n", |
| "a t", |
| "e d", |
| "e n", |
| "t o", |
| "in g", |
| "an d", |
| "i s", |
| "a s", |
| "a l", |
| "o r", |
| "o f", |
| "a r", |
| "i t", |
| "e s", |
| "h e", |
| "s t", |
| "l e", |
| "o m", |
| "s e", |
| "b e", |
| "a d", |
| "o w", |
| "l y", |
| "c h", |
| "w h", |
| "th at", |
| "y ou", |
| "l i", |
| "v e", |
| "a c", |
| "t i", |
| "l d", |
| "m e", |
| "w as", |
| "g h", |
| "i d", |
| "l l", |
| "w i", |
| "en t", |
| "f or", |
| "a y", |
| "r o", |
| "v er", |
| "i c", |
| "h er", |
| "k e", |
| "h is", |
| "n o", |
| "u t", |
| "u n", |
| "i r", |
| "l o", |
| "w e", |
| "r i", |
| "h a", |
| "wi th", |
| "gh t", |
| "ou t", |
| "i m", |
| "i on", |
| "al l", |
| "a b", |
| "on e", |
| "n e", |
| "g e", |
| "ou ld", |
| "t er", |
| "m o", |
| "h ad", |
| "c e", |
| "s he", |
| "g o", |
| "s h", |
| "u r", |
| "a m", |
| "s o", |
| "p e", |
| "m y", |
| "d e", |
| "a re", |
| "b ut", |
| "om e", |
| "f r", |
| "the r", |
| "f e", |
| "s u", |
| "d o", |
| "c on", |
| "t e", |
| "a in", |
| "er e", |
| "p o", |
| "i f", |
| "the y", |
| "u s", |
| "a g", |
| "t r", |
| "n ow", |
| "ou n", |
| "th is", |
| "ha ve", |
| "no t", |
| "s a", |
| "i l", |
| "u p", |
| "th ing", |
| "fr om", |
| "a p", |
| "h im", |
| "ac k", |
| "at ion", |
| "an t", |
| "ou r", |
| "o p", |
| "li ke", |
| "u st", |
| "es s", |
| "b o", |
| "o k", |
| "u l", |
| "in d", |
| "e x", |
| "c om", |
| "s ome", |
| "the re", |
| "er s", |
| "c o", |
| "re s", |
| "m an", |
| "ar d", |
| "p l", |
| "w or", |
| "w ay", |
| "ti on", |
| "f o", |
| "c a", |
| "w ere", |
| "b y", |
| "at e", |
| "p ro", |
| "t ed", |
| "oun d", |
| "ow n", |
| "w ould", |
| "t s", |
| "wh at", |
| "q u", |
| "al ly", |
| "i ght", |
| "c k", |
| "g r", |
| "wh en", |
| "v en", |
| "c an", |
| "ou gh", |
| "in e", |
| "en d", |
| "p er", |
| "ou s", |
| "o d", |
| "id e", |
| "k now", |
| "t y", |
| "ver y", |
| "s i", |
| "a k", |
| "wh o", |
| "ab out", |
| "i ll", |
| "the m", |
| "es t", |
| "re d", |
| "y e", |
| "c ould", |
| "on g", |
| "you r", |
| "the ir", |
| "e m", |
| "j ust", |
| "o ther", |
| "in to", |
| "an y", |
| "wh i", |
| "u m", |
| "t w", |
| "as t", |
| "d er", |
| "d id", |
| "i e", |
| "be en", |
| "ac e", |
| "in k", |
| "it y", |
| "b ack", |
| "t ing", |
| "b r", |
| "mo re", |
| "a ke", |
| "p p", |
| "the n", |
| "s p", |
| "e l", |
| "u se", |
| "b l", |
| "sa id", |
| "o ver", |
| "ge t", |
| "ɑ ː", |
| "i ː", |
| "u ː", |
| "ɜ ː", |
| "ɔ ː", |
| "o ː", |
| "e ɪ", |
| "o ʊ", |
| "a ɪ", |
| "a ʊ", |
| "ɔ ɪ", |
| "d ʒ", |
| "t ʃ", |
| "ɪ ŋ", |
| "ᵻ d", |
| "ˈ iː", |
| "ˌ iː", |
| "ˈ ɪ", |
| "ˌ ɪ", |
| "ˈ eɪ", |
| "ˌ eɪ", |
| "ˈ ɛ", |
| "ˌ ɛ", |
| "ˈ æ", |
| "ˌ æ", |
| "ˈ ɑː", |
| "ˌ ɑː", |
| "ˈ ɔː", |
| "ˌ ɔː", |
| "oː ɹ", |
| "ˈ oːɹ", |
| "ˌ oːɹ", |
| "ˈ oʊ", |
| "ˌ oʊ", |
| "ˈ ʊ", |
| "ˌ ʊ", |
| "ˈ uː", |
| "ˌ uː", |
| "ˈ ɜː", |
| "ˌ ɜː", |
| "ˈ ʌ", |
| "ˌ ʌ", |
| "ˈ aɪ", |
| "ˌ aɪ", |
| "ˈ aʊ", |
| "ˌ aʊ", |
| "ˈ ɔɪ", |
| "ˌ ɔɪ", |
| "ˈ ɚ", |
| "ˌ ɐ" |
| ] |
| } |
| } |