Upload vocab.json
Browse files- vocab.json +1 -0
vocab.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"<unk>": 0, "<s>": 1, "</s>": 2, ",": 3, ".": 4, "\u2581the": 5, "\u2581": 6, "s": 7, "\u2581I": 8, "\u2581to": 9, "t": 10, "\u2581a": 11, "ed": 12, "\u2581and": 13, "\u2581of": 14, "e": 15, "ing": 16, "d": 17, "a": 18, "o": 19, "\u2581in": 20, "n": 21, "\u2581was": 22, "i": 23, "\u2581\"": 24, "m": 25, "\u2581it": 26, "p": 27, "r": 28, "\u2581me": 29, "c": 30, "'": 31, "l": 32, "y": 33, "-": 34, "\u2581that": 35, "\u2581be": 36, "g": 37, "\u2581he": 38, "ly": 39, "\u2581for": 40, "k": 41, "\u2581with": 42, "\u2581my": 43, "u": 44, "er": 45, "\u2581not": 46, "\u2581is": 47, "\u2581s": 48, "\u2581you": 49, "\u2581as": 50, "h": 51, "\u2581but": 52, "or": 53, "in": 54, "re": 55, ".\"": 56, "f": 57, "\u2581on": 58, "ar": 59, "\u2581at": 60, "\u2581or": 61, "\u2581had": 62, "\u2581p": 63, "b": 64, "\u2581this": 65, "\u2581would": 66, "\u2581re": 67, "\u2581The": 68, "at": 69, "\u2581so": 70, "\u2581his": 71, "\u2581f": 72, "\u2581c": 73, "an": 74, "\u2581by": 75, "\u2581have": 76, "\u2581b": 77, "\u2581no": 78, "w": 79, "en": 80, "\u2581one": 81, "le": 82, "al": 83, "st": 84, "ri": 85, "it": 86, "v": 87, "ll": 88, "\u2581him": 89, "\u2581all": 90, "\u2581de": 91, "ch": 92, "\u2581if": 93, "\u2581do": 94, "\u2581Shirt": 95, "\u2581Red": 96, "se": 97, "\u2581w": 98, "th": 99, "\u2581out": 100, "\u2581from": 101, "I": 102, "\u2581they": 103, "\u2581A": 104, "ur": 105, "\u2581go": 106, "\u2581about": 107, "\u2581there": 108, "ent": 109, "\u2581said": 110, "\u2581like": 111, "on": 112, "ow": 113, ";": 114, "\u2581we": 115, "\u2581were": 116, "\u2581who": 117, "es": 118, "\u2581up": 119, "\u2581Porcupine": 120, "\u2581are": 121, "\u2581them": 122, "\u2581school": 123, "ic": 124, "\u2581co": 125, "il": 126, ",\"": 127, "ce": 128, "\u2581any": 129, "ve": 130, "is": 131, "\u2581when": 132, "ro": 133, "un": 134, "\u2581get": 135, "\u2581room": 136, "ne": 137, "\u2581which": 138, "H": 139, "id": 140, "te": 141, "\"": 142, "\u2581did": 143, "um": 144, "?\"": 145, "\u2581some": 146, "!": 147, "\u2581house": 148, "ir": 149, "\u2581see": 150, "ation": 151, "\u2581He": 152, "?": 153, "\u2581l": 154, "\u2581been": 155, "pe": 156, "\u2581what": 157, "\u2581could": 158, "\u2581M": 159, "\u2581If": 160, "\u2581fellow": 161, "\u2581such": 162, "E": 163, "ut": 164, "\u2581can": 165, "\u2581she": 166, "\u2581an": 167, "\u2581more": 168, "\u2581S": 169, "\u2581time": 170, "\u2581will": 171, "el": 172, "\u2581other": 173, "\u2581should": 174, "\u2581may": 175, "\u2581her": 176, "T": 177, "\u2581Clown": 178, "\u2581sh": 179, "\u2581old": 180, "\u2581way": 181, "able": 182, "ng": 183, "\u2581back": 184, "\u2581make": 185, "\u2581come": 186, "la": 187, "\u2581Gutenberg": 188, "\u2581than": 189, "\u2581us": 190, "A": 191, "\u2581right": 192, "ate": 193, "ous": 194, "\u2581only": 195, "\u2581teacher": 196, "\u2581thought": 197, "us": 198, "R": 199, "qu": 200, "\u2581students": 201, "\u2581know": 202, "\u2581going": 203, "\u2581Project": 204, "\u2581their": 205, "\u2581take": 206, "N": 207, "\u2581say": 208, "ke": 209, "\u2581don": 210, "ter": 211, "\u2581two": 212, "\u2581work": 213, "\u2581asked": 214, "ot": 215, "ive": 216, "\u2581am": 217, "\u2581night": 218, ":": 219, "\u2581Kiyo": 220, "\u2581un": 221, "\u2581after": 222, "\u2581pro": 223, "\u2581gr": 224, "\u2581head": 225, "\u2581ex": 226, "\u2581But": 227, "ul": 228, "ment": 229, "\u2581ma": 230, "\u2581might": 231, "\u2581even": 232, "\u2581face": 233, "!\"": 234, "and": 235, "\u2581T": 236, "\u2581dis": 237, "\u2581principal": 238, "\u2581three": 239, "ance": 240, "\u2581It": 241, "\u2581down": 242, "\u2581made": 243, "\u2581off": 244, ",--": 245, "\u2581con": 246, "\u2581your": 247, "\u2581bo": 248, "\u2581over": 249, "ence": 250, "\u2581has": 251, "he": 252, "]": 253, "\u2581want": 254, "\u2581into": 255, "O": 256, "\u2581mo": 257, "ad": 258, "\u2581think": 259, "\u2581sp": 260, "\u2581much": 261, "......": 262, "\u2581told": 263, "ity": 264, "led": 265, "op": 266, "\u2581far": 267, "if": 268, "\u2581F": 269, "S": 270, "\u2581No": 271, "That": 272, "\u2581This": 273, "ty": 274, "L": 275, "\u2581something": 276, "ward": 277, "\u2581own": 278, "\u2581our": 279, "\u2581man": 280, "\u2581Then": 281, "ough": 282, "\u2581came": 283, "ally": 284, "\u2581ga": 285, "\u2581mean": 286, "\u2581B": 287, "ant": 288, "\u2581Tokyo": 289, "\u2581ha": 290, "ish": 291, "ver": 292, "\u2581When": 293, "\u2581good": 294, "x": 295, "\u2581first": 296, "\u2581thing": 297, "\u2581D": 298, "\u2581K": 299, "tion": 300, "\u2581place": 301, "\u2581long": 302, "\u2581better": 303, "\u2581tell": 304, "\u2581how": 305, "age": 306, "\u2581went": 307, "\u2581day": 308, "\u2581just": 309, "\u2581sure": 310, "\u2581part": 311, "\u2581town": 312, "\u2581away": 313, "W": 314, "\u2581On": 315, "\u2581before": 316, "\u2581kind": 317, "ful": 318, "less": 319, "em": 320, "\u2581looked": 321, "ion": 322, "\u2581talk": 323, "\u2581heard": 324, "tm": 325, "\u2581now": 326, "\u2581sen": 327, "ther": 328, "ry": 329, "J": 330, "\u2581What": 331, "\u2581P": 332, "\u2581Squash": 333, "\u2581wrong": 334, "\u2581without": 335, "\u2581sha": 336, "\u2581where": 337, "\u2581They": 338, "0": 339, "U": 340, "\u2581Hubbard": 341, "\u2581return": 342, "\u2581here": 343, "\u2581same": 344, "ling": 345, "\u2581many": 346, "\u2581well": 347, "\u2581once": 348, "\u2581You": 349, "1": 350, "\u2581because": 351, "\u2581matter": 352, "\u2581And": 353, "ever": 354, "F": 355, "\u2581give": 356, "\u2581letter": 357, "\u2581show": 358, "\u2581fish": 359, "up": 360, "\u2581look": 361, "The": 362, "\u2581myself": 363, "\u2581laugh": 364, "\u2581yen": 365, "\u2581O": 366, "D": 367, "\u2581bu": 368, "\u2581anything": 369, "\u2581care": 370, "\u2581days": 371, "\u2581ra": 372, "\u2581There": 373, "\u2581saying": 374, "\u2581So": 375, "\u2581having": 376, "\u2581hand": 377, "\u2581ho": 378, "\u2581being": 379, "\u2581As": 380, "\u2581comp": 381, ")": 382, "\u2581while": 383, "\u2581Koga": 384, "\u2581class": 385, "\u2581never": 386, "\u25811.": 387, "\u2581set": 388, "est": 389, "\u2581mi": 390, "C": 391, "\u2581follow": 392, "\u2581left": 393, "\u2581C": 394, "\u2581new": 395, "\u2581very": 396, "\u2581seemed": 397, "\u2581di": 398, "\u2581dr": 399, "ction": 400, "\u2581person": 401, "\u2581must": 402, "\u2581bad": 403, "\u2581We": 404, "--": 405, "ble": 406, "\u2581again": 407, "\u2581watch": 408, "body": 409, "\u2581(": 410, "\u2581per": 411, "\u2581tra": 412, "\u2581those": 413, "\u2581teachers": 414, "P": 415, "\u2581read": 416, "\u2581sat": 417, "\u2581da": 418, "\u2581hot": 419, "\u2581start": 420, "\u2581became": 421, "\u2581felt": 422, "\u2581found": 423, "M": 424, "ust": 425, "\u2581started": 426, "\u2581[": 427, "\u2581middle": 428, "\u2581salary": 429, "\u2581through": 430, "\u2581half": 431, "\u2581raise": 432, "\u2581took": 433, "You": 434, "\u2581upon": 435, "\u2581soon": 436, "ies": 437, "\u2581E": 438, "\u2581pai": 439, "\u2581str": 440, "\u2581works": 441, "\u2581cannot": 442, "\u2581pass": 443, "\u2581hard": 444, "\u2581mind": 445, "\u2581began": 446, "\u2581saw": 447, "\u2581nothing": 448, "ash": 449, "\u2581mar": 450, "\u2581Badger": 451, "\u2581next": 452, "\u2581quite": 453, "\u2581keep": 454, "\u2581still": 455, "\u2581become": 456, "\u2581She": 457, "\u2581hour": 458, "fter": 459, "ound": 460, "\u2581Madonna": 461, "\u2581voice": 462, "\u2581remark": 463, "\u2581turn": 464, "\u2581name": 465, "\u2581live": 466, "\u2581line": 467, "\u2581boarding": 468, "\u2581To": 469, "\u2581called": 470, "\u2581consider": 471, "\u2581electronic": 472, "\u2581woman": 473, "\u2581reason": 474, "\u2581money": 475, "\u2581year": 476, "\u2581since": 477, "\u2581round": 478, "\u2581help": 479, "\u2581full": 480, "[": 481, "\u2581put": 482, "\u2581appeared": 483, "\u2581appear": 484, "\u2581cha": 485, "ome": 486, "No": 487, "\u2581country": 488, "\u2581geisha": 489, "\u2581resign": 490, "\u2581leave": 491, "\u2581paper": 492, "\u2581open": 493, "\u2581home": 494, "\u2581find": 495, "\u2581side": 496, "Well": 497, "ness": 498, "\u2581answered": 499, "\u2581G": 500, "ook": 501, "way": 502, "\u2581While": 503, "\u2581fight": 504, "Yes": 505, "Say": 506, "tain": 507, "\u2581feet": 508, "G": 509, "light": 510, "\u2581front": 511, "\u2581brother": 512, "\u2581fool": 513, "\u2581stay": 514, "\u2581walk": 515, "\u2581bath": 516, "\u2581pay": 517, "B": 518, "day": 519, "\u2581sea": 520, "\u2581little": 521, "\u2581people": 522, "\u2581second": 523, "\u2581terms": 524, "\u2581stop": 525, "\u2581end": 526, "\u2581ti": 527, "\u2581hu": 528, "\u2581One": 529, "5": 530, "\u2581affair": 531, "\u2581straight": 532, "\u2581written": 533, "\u2581Foundation": 534, "\u2581wonder": 535, "\u2581story": 536, "\u2581lady": 537, "\u2581six": 538, "\u2581eat": 539, "\u2581does": 540, "\u2581hi": 541, "\u2581My": 542, "\u2581call": 543, "\u2581expect": 544, "\u2581trouble": 545, "\u2581strange": 546, "\u2581why": 547, "\u2581four": 548, "\u2581bang": 549, "high": 550, "\u2581kid": 551, "ame": 552, "\u2581tea": 553, "What": 554, "night": 555, "\u2581already": 556, "\u2581kept": 557, "\u2581fact": 558, "\u2581dango": 559, "\u2581draw": 560, "\u2581manner": 561, "\u2581great": 562, "\u2581enough": 563, "\u2581every": 564, "\u2581last": 565, "\u2581coming": 566, "\u2581state": 567, "\u2581heart": 568, "\u2581Sir": 569, "\u2581though": 570, "Y": 571, "2": 572, "\u2581dinner": 573, "\u2581life": 574, "\u2581water": 575, "\u2581copy": 576, "\u2581stand": 577, "\u2581however": 578, "\u2581hotel": 579, "\u2581let": 580, "\u2581train": 581, "\u2581five": 582, "\u2581boat": 583, "ical": 584, "\u2581bra": 585, "head": 586, "\u2581Hotta": 587, "\u2581accept": 588, "\u2581happen": 589, "\u2581himself": 590, "\u2581stood": 591, "\u2581regard": 592, "\u2581noodle": 593, "\u2581eyes": 594, "\u2581clear": 595, "\u2581short": 596, "\u2581big": 597, "\u2581rather": 598, "\u2581dance": 599, "\u2581mother": 600, "ER": 601, "\u2581against": 602, "\u2581sound": 603, "\u2581most": 604, "\u2581both": 605, "\u2581simple": 606, "\u2581tak": 607, "amp": 608, "\u2581star": 609, "\u2581either": 610, "\u2581springs": 611, "\u2581another": 612, "\u2581father": 613, "\u2581also": 614, "\u2581under": 615, "\u2581receiv": 616, "\u2581agreement": 617, "\u2581near": 618, "\u2581act": 619, "\u2581need": 620, "\u2581feel": 621, "\u2581wish": 622, "aster": 623, "gue": 624, "\u2581answer": 625, "\u2581believe": 626, "\u2581business": 627, "\u2581farewell": 628, "\u2581position": 629, "\u2581question": 630, "\u2581surprise": 631, "\u2581brought": 632, "empura": 633, "\u2581serious": 634, "\u2581sleep": 635, "\u2581treat": 636, "\u2581each": 637, "\u2581hold": 638, "mper": 639, "time": 640, "where": 641, "\u2581va": 642, "\u2581board": 643, "\u2581public": 644, "\u2581friend": 645, "\u2581understand": 646, "\u2581gentle": 647, "\u2581everything": 648, "\u2581strong": 649, "\u2581month": 650, "\u2581tree": 651, "\u2581case": 652, "\u2581unless": 653, "\u2581moment": 654, "\u2581unti": 655, "\u2581tri": 656, "cial": 657, "bout": 658, "6": 659, "\u2581English": 660, "\u2581apologize": 661, "\u2581effort": 662, "\u2581original": 663, "\u2581particular": 664, "\u2581quiet": 665, "\u2581floor": 666, "\u2581Yedo": 667, "\u2581always": 668, "\u2581declar": 669, "\u2581please": 670, "\u2581small": 671, "\u2581certain": 672, "Why": 673, "CHA": 674, "\u2581blow": 675, "\u2581yet": 676, "\u2581direction": 677, "\u2581wait": 678, "\u2581poor": 679, "\u2581fine": 680, "\u2581hung": 681, "\u2581Some": 682, "\u2581account": 683, "\u2581attempt": 684, "\u2581grasshopper": 685, "\u2581sight": 686, "\u2581impress": 687, "\u2581knew": 688, "\u2581whether": 689, "\u2581Darling": 690, "\u2581writing": 691, "\u2581teaching": 692, "\u2581course": 693, "\u2581dark": 694, "\u2581sorry": 695, "\u2581agree": 696, "\u2581thus": 697, "\u2581serve": 698, "ably": 699, "\u2581try": 700, "\u2581office": 701, "\u2581desk": 702, "aving": 703, "\u2581los": 704, "This": 705, "aught": 706, "8": 707, "\u2581address": 708, "\u2581Nobeoka": 709, "\u2581includ": 710, "\u2581janitor": 711, "\u2581sweet": 712, "\u2581prefer": 713, "\u2581square": 714, "\u2581request": 715, "\u2581sign": 716, "\u2581least": 717, "\u2581propos": 718, "\u2581point": 719, "\u2581insist": 720, "\u2581indeed": 721, "\u2581around": 722, "\u2581Ya": 723, "\u2581game": 724, "\u2581tru": 725, "\u2581free": 726, "\u2581fee": 727, "\u2581notice": 728, "\u2581probab": 729, "\u2581lie": 730, "copyright": 731, "\u2581Archive": 732, "\u2581Literary": 733, "\u2581almost": 734, "\u2581different": 735, "\u2581eBook": 736, "\u2581paragraph": 737, "\u2581possible": 738, "\u2581punishment": 739, "\u2581transfer": 740, "\u2581twenty": 741, "\u2581black": 742, "\u2581future": 743, "\u2581natural": 744, "\u2581pocket": 745, "\u2581normal": 746, "\u2581tender": 747, "\u2581With": 748, "\u2581favor": 749, "\u2581easy": 750, "\u2581speech": 751, "\u2581fault": 752, "ccord": 753, "\u2581large": 754, "\u2581close": 755, "\u2581along": 756, "\u2581guy": 757, "\u2581inside": 758, "\u2581interest": 759, "\u2581entered": 760, "\u2581finish": 761, "\u2581alone": 762, "\u2581honor": 763, "\u2581among": 764, "\u2581sick": 765, "\u2581tired": 766, "\u2581fond": 767, "\u2581sub": 768, "\u2581law": 769, "\u2581week": 770, "\u2581order": 771, "etic": 772, "ock": 773, "note": 774, "K": 775, "change": 776, "\u2581physical": 777, "\u2581purpose": 778, "\u2581explain": 779, "\u2581mathematics": 780, "\u2581study": 781, "\u2581suppose": 782, "\u2581tomorrow": 783, "between": 784, "\u2581access": 785, "\u2581incident": 786, "\u2581limit": 787, "\u2581listen": 788, "\u2581respect": 789, "\u2581prais": 790, "\u2581morning": 791, "\u2581behind": 792, "\u2581outside": 793, "\u2581provide": 794, "\u2581honest": 795, "\u2581worry": 796, "\u2581mouth": 797, "\u2581stone": 798, "\u2581scene": 799, "\u2581play": 800, "\u2581dress": 801, "\u2581donations": 802, "\u2581tank": 803, "\u2581else": 804, "\u2581begin": 805, "Let": 806, "\u2581wide": 807, "\u2581compli": 808, "mashi": 809, "ability": 810, "like": 811, "\u2581bamboo": 812, "\u2581picture": 813, "\u2581difficult": 814, "\u2581narrow": 815, "\u2581object": 816, "\u2581opinion": 817, "\u2581pleasure": 818, "\u2581somewhat": 819, "\u2581understood": 820, "\u2581view": 821, "\u2581character": 822, "\u2581pretty": 823, "\u2581minute": 824, "\u2581present": 825, "\u2581loud": 826, "\u2581rolled": 827, "mission": 828, "\u2581further": 829, "\u2581spoke": 830, "\u2581write": 831, "\u2581cause": 832, "\u2581proper": 833, "clock": 834, "\u2581litera": 835, "cross": 836, "\u2581idea": 837, "\u2581wall": 838, "\u2581past": 839, "teacher": 840, "utenberg": 841, "rofessor": 842, "\u2581However": 843, "\u2581Ikagin": 844, "\u2581License": 845, "\u2581United": 846, "\u2581easily": 847, "\u2581effect": 848, "\u2581stepped": 849, "\u2581stuff": 850, "\u2581suggest": 851, "\u2581sympath": 852, "\u2581temple": 853, "\u2581yesterday": 854, "\u2581command": 855, "\u2581entrance": 856, "\u2581visit": 857, "\u2581living": 858, "\u2581States": 859, "\u2581world": 860, "\u2581sword": 861, "\u2581speak": 862, "\u2581history": 863, "\u2581lack": 864, "\u2581fetch": 865, "\u2581queer": 866, "\u2581require": 867, "\u2581block": 868, "\u2581spirit": 869, "\u2581tax": 870, "\u2581crook": 871, "\u2581early": 872, "\u2581gradua": 873, "\u2581Even": 874, "\u2581style": 875, "\u2581push": 876, "\u2581catch": 877, "\u2581shirt": 878, "\u2581arra": 879, "\u2581invite": 880, "stead": 881, "\u2581usual": 882, "machi": 883, "\u2581direct": 884, "\u2581perform": 885, "\u2581polite": 886, "\u2581similar": 887, "Besides": 888, "\u2581Kadoya": 889, "\u2581Yoshikawa": 890, "\u2581afraid": 891, "\u2581associated": 892, "\u2581display": 893, "\u2581distribute": 894, "\u2581dormitory": 895, "\u2581enjoy": 896, "\u2581nephew": 897, "\u2581province": 898, "\u2581themselves": 899, "\u2581trademark": 900, "\u2581translation": 901, "\u2581quick": 902, "\u2581supper": 903, "\u2581affect": 904, "\u2581knock": 905, "\u2581nature": 906, "\u2581neither": 907, "\u2581eggs": 908, "\u2581intention": 909, "\u2581fashion": 910, "\u2581respon": 911, "\u2581corner": 912, "\u2581girl": 913, "\u2581street": 914, "Where": 915, "nformation": 916, "\u2581attend": 917, "\u2581print": 918, "claim": 919, "\u2581trick": 920, "mitted": 921, "fresh": 922, "\u2581smile": 923, "\u2581commen": 924, "ropped": 925, "\u2581copie": 926, "\u2581express": 927, "\u2581number": 928, "\u2581whisper": 929, "\u2581addition": 930, "\u2581consolation": 931, "\u2581explanation": 932, "\u2581judg": 933, "\u2581language": 934, "\u2581mistake": 935, "\u2581police": 936, "\u2581potatoes": 937, "\u2581previous": 938, "\u2581shoji": 939, "\u2581thoroughly": 940, "\u2581thunder": 941, "\u2581twist": 942, "\u2581volunteer": 943, "\u2581decline": 944, "\u2581mischief": 945, "\u2581success": 946, "\u2581thirty": 947, "\u2581refund": 948, "\u2581charge": 949, "\u2581funny": 950, "\u2581appeal": 951, "\u2581patron": 952, "\u2581piece": 953, "\u2581credit": 954, "\u2581pack": 955, "\u2581fifty": 956, "\u2581danger": 957, "\u2581glad": 958, "\u2581duty": 959, "\u2581equal": 960, "depend": 961, "becom": 962, "astard": 963, "\u2581doubl": 964, "\u2581simpl": 965, "\u2581occup": 966, "collared": 967, "\u2581Bachelor": 968, "\u2581Russian": 969, "\u2581Toyama": 970, "\u2581absurd": 971, "\u2581beautiful": 972, "\u2581blunder": 973, "\u2581distributing": 974, "\u2581education": 975, "\u2581eight": 976, "\u2581family": 977, "\u2581giving": 978, "\u2581instructor": 979, "\u2581occasion": 980, "\u2581replied": 981, "\u2581smooth": 982, "\u2581stuck": 983, "\u2581subject": 984, "\u2581suffer": 985, "\u2581swimming": 986, "\u2581swollen": 987, "\u2581twice": 988, "\u2581upstairs": 989, "\u2581Natsume": 990, "\u2581condition": 991, "\u2581discharge": 992, "\u2581garden": 993, "\u2581grabbe": 994, "(": 995, "*": 996, "z": 997, "q": 998, "j": 999}
|