{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "!", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "<|startoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 2, "content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "NFC" }, { "type": "Replace", "pattern": { "Regex": "\\s+" }, "content": " " }, { "type": "Lowercase" } ] }, "pre_tokenizer": { "type": "Sequence", "pretokenizers": [ { "type": "Split", "pattern": { "Regex": "'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+" }, "behavior": "Removed", "invert": true }, { "type": "ByteLevel", "add_prefix_space": false, "trim_offsets": true, "use_regex": true } ] }, "post_processor": { "type": "RobertaProcessing", "sep": [ "<|endoftext|>", 2 ], "cls": [ "<|startoftext|>", 1 ], "trim_offsets": false, "add_prefix_space": false }, "decoder": { "type": "ByteLevel", "add_prefix_space": true, "trim_offsets": true, "use_regex": true }, "model": { "type": "BPE", "dropout": null, "unk_token": "<|endoftext|>", "continuing_subword_prefix": "", "end_of_word_suffix": "", "fuse_unk": false, "vocab": { "!": 0, "<|startoftext|>": 1, "<|endoftext|>": 2, "\"": 3, "#": 4, "$": 5, "%": 6, "&": 7, "'": 8, "(": 9, ")": 10, "*": 11, "+": 12, ",": 13, "-": 14, ".": 15, "/": 16, "0": 17, "1": 18, "2": 19, "3": 20, "4": 21, "5": 22, "6": 23, "7": 24, "8": 25, "9": 26, ":": 27, ";": 28, "<": 29, "=": 30, ">": 31, "?": 32, "@": 33, "[": 34, "\\": 35, "]": 36, "^": 37, "_": 38, "`": 39, "a": 40, "b": 41, "c": 42, "d": 43, "e": 44, "f": 45, "g": 46, "h": 47, "i": 48, "j": 49, "k": 50, "l": 51, "m": 52, "n": 53, "o": 54, "p": 55, "q": 56, "r": 57, "s": 58, "t": 59, "u": 60, "v": 61, "w": 62, "x": 63, "y": 64, "z": 65, "|": 66, "}": 67, "~": 68, "¡": 69, "¢": 70, "£": 71, "¤": 72, "¥": 73, "¦": 74, "§": 75, "¨": 76, "©": 77, "ª": 78, "«": 79, "¬": 80, "®": 81, "¯": 82, "°": 83, "±": 84, "²": 85, "³": 86, "´": 87, "µ": 88, "¶": 89, "·": 90, "¸": 91, "¹": 92, "º": 93, "»": 94, "¼": 95, "½": 96, "¾": 97, "¿": 98, "Â": 99, "Ã": 100, "Ä": 101, "Å": 102, "Æ": 103, "Ç": 104, "È": 105, "É": 106, "Ê": 107, "Ë": 108, "Ì": 109, "Í": 110, "Î": 111, "Ï": 112, "Ð": 113, "Ñ": 114, "Ö": 115, "×": 116, "Ø": 117, "Ù": 118, "Ü": 119, "à": 120, "á": 121, "â": 122, "ã": 123, "ä": 124, "å": 125, "æ": 126, "ç": 127, "è": 128, "é": 129, "ë": 130, "ì": 131, "ï": 132, "Ģ": 133, "ģ": 134, "Ĥ": 135, "ĥ": 136, "Ħ": 137, "ħ": 138, "Ĩ": 139, "ĩ": 140, "Ī": 141, "ī": 142, "Ĭ": 143, "ĭ": 144, "Į": 145, "į": 146, "İ": 147, "ı": 148, "IJ": 149, "ij": 150, "Ĵ": 151, "ĵ": 152, "Ķ": 153, "ķ": 154, "ĸ": 155, "Ĺ": 156, "ĺ": 157, "Ļ": 158, "ļ": 159, "Ľ": 160, "ľ": 161, "Ŀ": 162, "ŀ": 163, "Ł": 164, "ł": 165, "Ń": 166, "e": 167, "n": 168, "s": 169, "o": 170, "g": 171, "a": 172, "r": 173, "t": 174, "w": 175, "d": 176, "y": 177, "i": 178, "p": 179, "l": 180, "h": 181, "f": 182, "k": 183, "c": 184, "v": 185, "m": 186, "x": 187, "z": 188, "u": 189, "ľ": 190, "[": 191, "ģ": 192, "|": 193, "¼": 194, "j": 195, "į": 196, "²": 197, "b": 198, "ĩ": 199, "Ļ": 200, "¿": 201, "¡": 202, "'": 203, ">": 204, "¢": 205, "±": 206, "·": 207, "¶": 208, "«": 209, "¤": 210, "©": 211, "½": 212, "³": 213, "Ń": 214, "\\": 215, "+": 216, "¸": 217, "¨": 218, "Ł": 219, "ĺ": 220, "Ľ": 221, "¹": 222, "Ĩ": 223, "Ģ": 224, "Ĺ": 225, "°": 226, "-": 227, "Ĥ": 228, "Į": 229, "ħ": 230, "Ĭ": 231, "§": 232, "IJ": 233, "`": 234, "q": 235, "ķ": 236, "µ": 237, "ī": 238, "º": 239, "!": 240, "¯": 241, "Ŀ": 242, "Ħ": 243, "ł": 244, "%": 245, "£": 246, "¦": 247, "ŀ": 248, "¾": 249, "´": 250, "ĵ": 251, "^": 252, "Ķ": 253, "ª": 254, "»": 255, "0": 256, "5": 257, "ĸ": 258, "ļ": 259, "İ": 260, "=": 261, "Ĵ": 262, "Ī": 263, "ĥ": 264, "¥": 265, "®": 266, "3": 267, "¬": 268, ".": 269, "1": 270, "ĭ": 271, "ij": 272, "@": 273, "&": 274, "ı": 275, "~": 276, "8": 277, "}": 278, "*": 279, ";": 280, "\"": 281, "2": 282, "(": 283, ")": 284, "4": 285, "9": 286, "/": 287, ":": 288, "#": 289, ",": 290, "$": 291, "]": 292, "<": 293, "_": 294, "?": 295, "6": 296, "7": 297, "th": 298, "the": 299, "in": 300, "an": 301, "ed": 302, "er": 303, "re": 304, "ar": 305, "ti": 306, "on": 307, "en": 308, "of": 309, "or": 310, "and": 311, "er": 312, "on": 313, "in": 314, "ing": 315, "st": 316, "ro": 317, "al": 318, "it": 319, "to": 320, "as": 321, "at": 322, "es": 323, "ou": 324, "hi": 325, "ac": 326, "si": 327, "at": 328, "ri": 329, "al": 330, "el": 331, "an": 332, "am": 333, "or": 334, "st": 335, "li": 336, "ur": 337, "ec": 338, "om": 339, "di": 340, "was": 341, "ly": 342, "en": 343, "ea": 344, "ch": 345, "un": 346, "tion": 347, "la": 348, "is": 349, "fi": 350, "ol": 351, "de": 352, "-@": 353, "@-@": 354, "ra": 355, "vi": 356, "le": 357, "lo": 358, "sh": 359, "em": 360, "be": 361, "that": 362, "'s": 363, "con": 364, "ma": 365, "for": 366, "ha": 367, "su": 368, "by": 369, "ith": 370, "ve": 371, "with": 372, "se": 373, "ch": 374, "the": 375, "ent": 376, "po": 377, "ce": 378, "il": 379, "se": 380, "ent": 381, "le": 382, "com": 383, "sp": 384, "ere": 385, "pro": 386, "no": 387, "bu": 388, "wh": 389, "it": 390, "th": 391, "ver": 392, "ne": 393, "ca": 394, "is": 395, "for": 396, "ag": 397, "ers": 398, "mo": 399, "gh": 400, "fro": 401, "ted": 402, "from": 403, "tion": 404, "op": 405, "his": 406, "ad": 407, "ab": 408, "ic": 409, "he": 410, "oun": 411, "as": 412, "ts": 413, "sc": 414, "de": 415, "ow": 416, "ex": 417, "whi": 418, "ru": 419, "ter": 420, "ap": 421, "ds": 422, "were": 423, "pre": 424, "du": 425, "gu": 426, "par": 427, "ir": 428, "bo": 429, "ther": 430, "qu": 431, "lu": 432, "ter": 433, "tw": 434, "es": 435, "rec": 436, "per": 437, "ta": 438, "ate": 439, "ver": 440, "ated": 441, "ding": 442, "ity": 443, "man": 444, "ear": 445, "sed": 446, "ded": 447, "au": 448, "all": 449, "ame": 450, "ci": 451, "one": 452, "ing": 453, "are": 454, "af": 455, "ir": 456, "ation": 457, "âĢ": 458, "had": 459, "tr": 460, "ul": 461, "ld": 462, "which": 463, "wa": 464, "im": 465, "lea": 466, "be": 467, "to": 468, "tim": 469, "fir": 470, "wor": 471, "ong": 472, "por": 473, "mar": 474, "me": 475, "ally": 476, "so": 477, "out": 478, "tions": 479, "its": 480, "gh": 481, "ge": 482, "ber": 483, "fe": 484, "pu": 485, "ser": 486, "der": 487, "pl": 488, "ss": 489, "ine": 490, "inc": 491, "mi": 492, "ght": 493, "go": 494, "this": 495, "tur": 496, "da": 497, "rou": 498, "but": 499, "um": 500, "son": 501, "we": 502, "ved": 503, "sion": 504, "ke": 505, "pla": 506, "their": 507, "ies": 508, "first": 509, "sa": 510, "oc": 511, "att": 512, "of": 513, "pe": 514, "not": 515, "gi": 516, "na": 517, "ary": 518, "mu": 519, "led": 520, "âĢĵ": 521, "her": 522, "ran": 523, "co": 524, "they": 525, "der": 526, "ali": 527, "also": 528, "ore": 529, "ep": 530, "ould": 531, "after": 532, "shi": 533, "us": 534, "et": 535, "tic": 536, "stor": 537, "wi": 538, "ev": 539, "other": 540, "sh": 541, "ting": 542, "ard": 543, "te": 544, "two": 545, "ni": 546, "have": 547, "our": 548, "comm": 549, "te": 550, "ack": 551, "oo": 552, "fin": 553, "sec": 554, "ents": 555, "has": 556, "comp": 557, "bec": 558, "ks": 559, "cont": 560, "land": 561, "been": 562, "ence": 563, "king": 564, "el": 565, "age": 566, "low": 567, "min": 568, ".@": 569, "@.@": 570, "ome": 571, "ment": 572, "char": 573, "ge": 574, "ater": 575, "nor": 576, "ho": 577, "ous": 578, "who": 579, "ear": 580, "spec": 581, "col": 582, "ely": 583, "ty": 584, "jo": 585, "uring": 586, "duc": 587, "bri": 588, "str": 589, "can": 590, "ori": 591, "tra": 592, "pa": 593, "she": 594, "do": 595, "tive": 596, "mon": 597, "new": 598, "rit": 599, "time": 600, "ons": 601, "so": 602, "man": 603, "dec": 604, "cent": 605, "lan": 606, "pi": 607, "our": 608, "inter": 609, "fer": 610, "gra": 611, "gre": 612, "res": 613, "inclu": 614, "mil": 615, "during": 616, "own": 617, "pres": 618, "ju": 619, "ned": 620, "ell": 621, ",@": 622, "@,@": 623, "ite": 624, "gen": 625, "when": 626, "sig": 627, "bi": 628, "ren": 629, "fa": 630, "ga": 631, "play": 632, "eng": 633, "tional": 634, "ound": 635, "thou": 636, "more": 637, "ree": 638, "ember": 639, "ei": 640, "sou": 641, "sur": 642, "sti": 643, "car": 644, "form": 645, "lar": 646, "ses": 647, "ten": 648, "into": 649, "tu": 650, "ces": 651, "most": 652, "ked": 653, "way": 654, "cre": 655, "coun": 656, "up": 657, "les": 658, "ace": 659, "als": 660, "ke": 661, "would": 662, "ant": 663, "ber": 664, "fu": 665, "ited": 666, "pri": 667, "while": 668, "over": 669, "ings": 670, "re": 671, "fil": 672, "sy": 673, "est": 674, "able": 675, "wn": 676, "sea": 677, "ach": 678, "sing": 679, "ins": 680, "tic": 681, "id": 682, "only": 683, "ates": 684, "tri": 685, "ving": 686, "ba": 687, "vel": 688, "ance": 689, "sta": 690, "ern": 691, "fol": 692, "een": 693, "ined": 694, "stru": 695, "uni": 696, "game": 697, "lar": 698, "sel": 699, "bli": 700, "used": 701, "ning": 702, "ps": 703, "ties": 704, "kno": 705, "cor": 706, "ft": 707, "recor": 708, "ble": 709, "vie": 710, "ys": 711, "wil": 712, "ical": 713, "app": 714, "tro": 715, "three": 716, "cla": 717, "old": 718, "shed": 719, "hea": 720, "about": 721, "writ": 722, "than": 723, "ste": 724, "later": 725, "ari": 726, "dy": 727, "publi": 728, "loc": 729, "aga": 730, "throu": 731, "ssi": 732, "end": 733, "may": 734, "ang": 735, "ach": 736, "ves": 737, "og": 738, "him": 739, "betw": 740, "though": 741, "between": 742, "um": 743, "star": 744, "scri": 745, "rea": 746, "ond": 747, "ship": 748, "ok": 749, "hel": 750, "song": 751, "chi": 752, "cap": 753, "ever": 754, "day": 755, "cri": 756, "some": 757, "bro": 758, "no": 759, "there": 760, "ans": 761, "all": 762, "num": 763, "red": 764, "ears": 765, "sts": 766, "any": 767, "war": 768, "ph": 769, "pp": 770, "gin": 771, "struc": 772, "amer": 773, "produc": 774, "sch": 775, "ces": 776, "ure": 777, "ating": 778, "emp": 779, "tor": 780, "season": 781, "fore": 782, "ic": 783, "city": 784, "gro": 785, "follow": 786, "sub": 787, "bel": 788, "year": 789, "can": 790, "sin": 791, "where": 792, "and": 793, "made": 794, "relea": 795, "sm": 796, "bl": 797, "ten": 798, "with": 799, "son": 800, "many": 801, "are": 802, "ed": 803, "how": 804, "americ": 805, "ury": 806, "stu": 807, "musi": 808, "cu": 809, "nam": 810, "ement": 811, "such": 812, "albu": 813, "buil": 814, "before": 815, "ef": 816, "arm": 817, "ton": 818, "them": 819, "cal": 820, "bar": 821, "des": 822, "mat": 823, "gener": 824, "od": 825, "series": 826, "cer": 827, "sho": 828, "enti": 829, "her": 830, "over": 831, "ann": 832, "well": 833, "world": 834, "gan": 835, "est": 836, "second": 837, "ters": 838, "side": 839, "tran": 840, "line": 841, "ture": 842, "port": 843, "being": 844, "years": 845, "both": 846, "indi": 847, "these": 848, "national": 849, "histor": 850, "fe": 851, "vo": 852, "sted": 853, "ani": 854, "bas": 855, "poin": 856, "sing": 857, "film": 858, "pen": 859, "sup": 860, "mis": 861, "cro": 862, "stri": 863, "lin": 864, "tre": 865, "war": 866, "however": 867, "ying": 868, "ling": 869, "yp": 870, "ected": 871, "direc": 872, "vision": 873, "album": 874, "then": 875, "ll": 876, "sever": 877, "through": 878, "known": 879, "bor": 880, "cul": 881, "clu": 882, "ster": 883, "south": 884, "ry": 885, "ect": 886, "low": 887, "pr": 888, "sk": 889, "iso": 890, "north": 891, "part": 892, "fac": 893, "tly": 894, "peri": 895, "eu": 896, "batt": 897, "state": 898, "ced": 899, "consi": 900, "inf": 901, "poli": 902, "olog": 903, "early": 904, "posi": 905, "ames": 906, "win": 907, "devel": 908, "ob": 909, "ve": 910, "ven": 911, "oper": 912, "ger": 913, "offi": 914, "charac": 915, "ms": 916, "high": 917, "ad": 918, "tho": 919, "several": 920, "dre": 921, "descri": 922, "ale": 923, "number": 924, "air": 925, "including": 926, "inst": 927, "against": 928, "ls": 929, "sul": 930, "episo": 931, "cam": 932, "dif": 933, "soci": 934, "became": 935, "like": 936, "tel": 937, "four": 938, "âĢĶ": 939, "hou": 940, "joh": 941, "united": 942, "inv": 943, "under": 944, "nov": 945, "tiv": 946, "suc": 947, "ations": 948, "ack": 949, "tor": 950, "ron": 951, "und": 952, "ws": 953, "fo": 954, "gr": 955, "develop": 956, "although": 957, "contin": 958, "west": 959, "origin": 960, "music": 961, "ors": 962, "don": 963, "century": 964, "ward": 965, "work": 966, "me": 967, "ami": 968, "cha": 969, "very": 970, "har": 971, "dis": 972, "zed": 973, "do": 974, "gs": 975, "tow": 976, "sol": 977, "following": 978, "lion": 979, "rema": 980, "ns": 981, "tish": 982, "chur": 983, "som": 984, "mp": 985, "tle": 986, "gover": 987, "del": 988, "comple": 989, "cur": 990, "use": 991, "back": 992, "hu": 993, "stern": 994, "began": 995, "fiel": 996, "ause": 997, "dra": 998, "pas": 999, "bil": 1000, "cation": 1001, "dent": 1002, "bed": 1003, "because": 1004, "ant": 1005, "eam": 1006, "phi": 1007, "yo": 1008, "continu": 1009, "tain": 1010, "try": 1011, "fre": 1012, "peop": 1013, "called": 1014, "found": 1015, "episode": 1016, "desig": 1017, "mor": 1018, "set": 1019, "ley": 1020, "east": 1021, "trac": 1022, "cra": 1023 }, "merges": [ "t h", "th e", "i n", "a n", "e d", "e r", "r e", "a r", "t i", "o n", "e n", "o f", "o r", "an d", "e r", "o n", "i n", "in g", "s t", "r o", "a l", "i t", "t o", "a s", "a t", "e s", "o u", "h i", "a c", "s i", "a t", "r i", "a l", "e l", "a n", "a m", "o r", "s t", "l i", "u r", "e c", "o m", "d i", "w as", "l y", "e n", "e a", "c h", "u n", "ti on", "l a", "i s", "f i", "o l", "d e", "- @", "@ -@", "r a", "v i", "l e", "l o", "s h", "e m", "b e", "th at", "' s", "c on", "m a", "f or", "h a", "s u", "b y", "it h", "v e", "w ith", "s e", "c h", "th e", "en t", "p o", "c e", "i l", "s e", "en t", "l e", "c om", "s p", "er e", "p ro", "n o", "b u", "w h", "i t", "t h", "v er", "n e", "c a", "i s", "f or", "a g", "er s", "m o", "g h", "f ro", "t ed", "fro m", "ti on", "o p", "hi s", "a d", "a b", "i c", "h e", "ou n", "a s", "t s", "s c", "d e", "o w", "e x", "w hi", "r u", "t er", "a p", "d s", "w ere", "p re", "d u", "g u", "p ar", "i r", "b o", "th er", "q u", "l u", "t er", "t w", "e s", "re c", "p er", "t a", "at e", "v er", "at ed", "d ing", "it y", "m an", "e ar", "s ed", "d ed", "a u", "al l", "am e", "c i", "on e", "in g", "ar e", "a f", "i r", "a tion", "â Ģ", "ha d", "t r", "u l", "l d", "whi ch", "w a", "i m", "l ea", "b e", "t o", "ti m", "fi r", "w or", "on g", "p or", "m ar", "m e", "al ly", "s o", "ou t", "tion s", "it s", "g h", "g e", "b er", "f e", "p u", "s er", "d er", "p l", "s s", "in e", "in c", "m i", "gh t", "g o", "th is", "t ur", "d a", "ro u", "bu t", "u m", "s on", "w e", "v ed", "si on", "k e", "p la", "the ir", "i es", "fir st", "s a", "o c", "at t", "o f", "p e", "no t", "g i", "n a", "ar y", "m u", "l ed", "âĢ ĵ", "h er", "r an", "c o", "the y", "d er", "al i", "al so", "or e", "e p", "ou ld", "af ter", "s hi", "u s", "e t", "ti c", "st or", "w i", "e v", "o ther", "s h", "t ing", "ar d", "t e", "tw o", "n i", "ha ve", "ou r", "com m", "t e", "ac k", "o o", "f in", "s ec", "ent s", "h as", "com p", "b ec", "k s", "con t", "l and", "be en", "en ce", "k ing", "e l", "ag e", "lo w", "m in", ". @", "@ .@", "om e", "m ent", "ch ar", "g e", "at er", "n or", "h o", "ou s", "wh o", "ea r", "sp ec", "c ol", "el y", "t y", "j o", "ur ing", "du c", "b ri", "st r", "c an", "or i", "t ra", "p a", "sh e", "d o", "ti ve", "m on", "ne w", "r it", "tim e", "on s", "s o", "m an", "d ec", "c ent", "l an", "p i", "ou r", "in ter", "f er", "g ra", "g re", "re s", "inc lu", "m il", "d uring", "ow n", "pre s", "j u", "n ed", "el l", ", @", "@ ,@", "it e", "g en", "wh en", "si g", "b i", "re n", "f a", "g a", "pla y", "en g", "tion al", "oun d", "th ou", "m ore", "re e", "em ber", "e i", "s ou", "s ur", "s ti", "c ar", "for m", "l ar", "s es", "t en", "in to", "t u", "c es", "mo st", "k ed", "wa y", "c re", "c oun", "u p", "l es", "ac e", "al s", "k e", "w ould", "an t", "b er", "f u", "it ed", "p ri", "whi le", "o ver", "ing s", "r e", "fi l", "s y", "e st", "ab le", "w n", "s ea", "ac h", "s ing", "in s", "ti c", "i d", "on ly", "at es", "t ri", "v ing", "b a", "v el", "an ce", "st a", "er n", "f ol", "e en", "in ed", "st ru", "un i", "g ame", "la r", "s el", "b li", "u sed", "n ing", "p s", "ti es", "k no", "c or", "f t", "rec or", "b le", "vi e", "y s", "w il", "ic al", "ap p", "t ro", "th ree", "c la", "ol d", "sh ed", "h ea", "ab out", "w rit", "th an", "st e", "l ater", "ar i", "d y", "pu bli", "lo c", "ag a", "th rou", "s si", "en d", "ma y", "an g", "ac h", "v es", "o g", "hi m", "be tw", "thou gh", "betw een", "u m", "st ar", "sc ri", "re a", "on d", "shi p", "o k", "h el", "s ong", "c hi", "ca p", "e ver", "da y", "c ri", "s ome", "b ro", "n o", "th ere", "an s", "al l", "n um", "r ed", "ear s", "st s", "an y", "w ar", "p h", "p p", "g in", "stru c", "am er", "pro duc", "s ch", "c es", "ur e", "at ing", "em p", "t or", "sea son", "for e", "i c", "c ity", "g ro", "fol low", "su b", "b el", "y ear", "c an", "s in", "wh ere", "an d", "ma de", "re lea", "s m", "b l", "t en", "wi th", "s on", "man y", "a re", "e d", "h ow", "amer ic", "ur y", "st u", "mu si", "c u", "n am", "em ent", "su ch", "al bu", "bu il", "be fore", "e f", "ar m", "t on", "the m", "c al", "b ar", "d es", "m at", "gen er", "o d", "ser ies", "c er", "sh o", "en ti", "h er", "o ver", "an n", "w ell", "wor ld", "g an", "e st", "sec ond", "t ers", "si de", "tr an", "l ine", "tur e", "por t", "be ing", "y ears", "bo th", "in di", "the se", "na tional", "hi stor", "f e", "v o", "st ed", "an i", "b as", "po in", "s ing", "fil m", "p en", "su p", "m is", "c ro", "st ri", "l in", "t re", "wa r", "how ever", "y ing", "l ing", "y p", "ec ted", "di rec", "vi sion", "albu m", "th en", "l l", "se ver", "throu gh", "kno wn", "b or", "c ul", "c lu", "st er", "sou th", "r y", "ec t", "lo w", "p r", "s k", "is o", "nor th", "par t", "f ac", "t ly", "per i", "e u", "b att", "st ate", "c ed", "con si", "in f", "po li", "ol og", "ear ly", "po si", "am es", "w in", "de vel", "o b", "v e", "v en", "op er", "g er", "of fi", "char ac", "m s", "hi gh", "a d", "th o", "sever al", "d re", "de scri", "al e", "num ber", "a ir", "inclu ding", "in st", "aga inst", "l s", "su l", "ep iso", "c am", "di f", "so ci", "bec ame", "li ke", "t el", "f our", "âĢ Ķ", "h ou", "jo h", "un ited", "in v", "un der", "no v", "ti v", "su c", "a tions", "ac k", "t or", "r on", "un d", "w s", "f o", "g r", "devel op", "al though", "cont in", "we st", "ori gin", "musi c", "or s", "d on", "cent ury", "w ard", "wor k", "m e", "am i", "ch a", "ver y", "h ar", "di s", "z ed", "d o", "g s", "t ow", "s ol", "follow ing", "li on", "re ma", "n s", "ti sh", "ch ur", "s om", "m p", "t le", "go ver", "d el", "comp le", "c ur", "u se", "b ack", "h u", "st ern", "be gan", "fi el", "au se", "d ra", "p as", "b il", "ca tion", "d ent", "b ed", "bec ause", "an t", "ea m", "p hi", "y o", "contin u", "ta in", "tr y", "f re", "pe op", "cal led", "f ound", "episo de", "de sig", "m or", "se t", "le y", "ea st", "tr ac", "c ra" ] } }