{ "architectures": [ "RobertaForTokenClassification" ], "attention_probs_dropout_prob": 0.1, "bos_token_id": 0, "classifier_dropout": null, "eos_token_id": 2, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "ADJ", "1": "ADP", "2": "ADP+DET", "3": "ADP+PRON", "4": "ADV", "5": "ADV+AUX", "6": "ADV+PART", "7": "AUX", "8": "AUX+PART", "9": "B-ADJ", "10": "B-ADJ+ADJ", "11": "B-ADJ+NOUN", "12": "B-ADJ+NOUN+NOUN", "13": "B-ADJ+PART", "14": "B-ADJ+PROPN", "15": "B-ADJ+PUNCT", "16": "B-ADP", "17": "B-ADP+ADJ", "18": "B-ADP+NOUN", "19": "B-ADP+PRON", "20": "B-ADV", "21": "B-ADV+AUX", "22": "B-ADV+PUNCT", "23": "B-AUX", "24": "B-AUX+ADV", "25": "B-AUX+PART", "26": "B-AUX+PART+VERB", "27": "B-AUX+VERB", "28": "B-CCONJ", "29": "B-DET", "30": "B-DET+AUX", "31": "B-DET+NOUN", "32": "B-INTJ", "33": "B-INTJ+PUNCT", "34": "B-NOUN", "35": "B-NOUN+ADJ", "36": "B-NOUN+ADP", "37": "B-NOUN+AUX", "38": "B-NOUN+NOUN", "39": "B-NOUN+NOUN+VERB", "40": "B-NOUN+PART", "41": "B-NOUN+PROPN", "42": "B-NOUN+PUNCT", "43": "B-NOUN+SCONJ", "44": "B-NOUN+VERB", "45": "B-NUM", "46": "B-PART", "47": "B-PRON", "48": "B-PRON+ADJ", "49": "B-PRON+ADV", "50": "B-PRON+AUX", "51": "B-PRON+NOUN", "52": "B-PRON+PART", "53": "B-PRON+PRON", "54": "B-PRON+VERB", "55": "B-PROPN", "56": "B-PROPN+ADP", "57": "B-PROPN+AUX", "58": "B-PROPN+PART", "59": "B-PROPN+PROPN", "60": "B-PROPN+PUNCT", "61": "B-PROPN+PUNCT+PUNCT", "62": "B-PROPN+VERB", "63": "B-PUNCT", "64": "B-PUNCT+PUNCT", "65": "B-PUNCT+PUNCT+PUNCT", "66": "B-PUNCT+SYM+PUNCT", "67": "B-SCONJ", "68": "B-SYM", "69": "B-VERB", "70": "B-VERB+ADJ", "71": "B-VERB+ADJ+CCONJ", "72": "B-VERB+ADP", "73": "B-VERB+ADV", "74": "B-VERB+ADV+PUNCT", "75": "B-VERB+AUX", "76": "B-VERB+CCONJ", "77": "B-VERB+DET", "78": "B-VERB+NOUN", "79": "B-VERB+NOUN+CCONJ", "80": "B-VERB+NOUN+NOUN", "81": "B-VERB+PART", "82": "B-VERB+PRON", "83": "B-VERB+PRON+ADP", "84": "B-VERB+PRON+ADV", "85": "B-VERB+PROPN", "86": "B-VERB+SCONJ", "87": "B-VERB+VERB", "88": "B-VERB+VERB+NOUN", "89": "B-X", "90": "B-X+PUNCT", "91": "B-X+PUNCT+PUNCT", "92": "B-X+X", "93": "B-X+X+PRON", "94": "CCONJ", "95": "DET", "96": "DET+NUM", "97": "I-ADJ", "98": "I-ADJ+ADJ", "99": "I-ADJ+NOUN", "100": "I-ADJ+NOUN+NOUN", "101": "I-ADJ+PART", "102": "I-ADJ+PROPN", "103": "I-ADJ+PUNCT", "104": "I-ADP", "105": "I-ADP+ADJ", "106": "I-ADP+NOUN", "107": "I-ADP+PRON", "108": "I-ADV", "109": "I-ADV+AUX", "110": "I-ADV+PUNCT", "111": "I-AUX", "112": "I-AUX+ADV", "113": "I-AUX+PART", "114": "I-AUX+PART+VERB", "115": "I-AUX+VERB", "116": "I-CCONJ", "117": "I-DET", "118": "I-DET+AUX", "119": "I-DET+NOUN", "120": "I-INTJ", "121": "I-INTJ+PUNCT", "122": "I-NOUN", "123": "I-NOUN+ADJ", "124": "I-NOUN+ADP", "125": "I-NOUN+AUX", "126": "I-NOUN+NOUN", "127": "I-NOUN+NOUN+VERB", "128": "I-NOUN+PART", "129": "I-NOUN+PROPN", "130": "I-NOUN+PUNCT", "131": "I-NOUN+SCONJ", "132": "I-NOUN+VERB", "133": "I-NUM", "134": "I-PART", "135": "I-PRON", "136": "I-PRON+ADJ", "137": "I-PRON+ADV", "138": "I-PRON+AUX", "139": "I-PRON+NOUN", "140": "I-PRON+PART", "141": "I-PRON+PRON", "142": "I-PRON+VERB", "143": "I-PROPN", "144": "I-PROPN+ADP", "145": "I-PROPN+AUX", "146": "I-PROPN+PART", "147": "I-PROPN+PROPN", "148": "I-PROPN+PUNCT", "149": "I-PROPN+PUNCT+PUNCT", "150": "I-PROPN+VERB", "151": "I-PUNCT", "152": "I-PUNCT+PUNCT", "153": "I-PUNCT+PUNCT+PUNCT", "154": "I-PUNCT+SYM+PUNCT", "155": "I-SCONJ", "156": "I-SYM", "157": "I-VERB", "158": "I-VERB+ADJ", "159": "I-VERB+ADJ+CCONJ", "160": "I-VERB+ADP", "161": "I-VERB+ADV", "162": "I-VERB+ADV+PUNCT", "163": "I-VERB+AUX", "164": "I-VERB+CCONJ", "165": "I-VERB+DET", "166": "I-VERB+NOUN", "167": "I-VERB+NOUN+CCONJ", "168": "I-VERB+NOUN+NOUN", "169": "I-VERB+PART", "170": "I-VERB+PRON", "171": "I-VERB+PRON+ADP", "172": "I-VERB+PRON+ADV", "173": "I-VERB+PROPN", "174": "I-VERB+SCONJ", "175": "I-VERB+VERB", "176": "I-VERB+VERB+NOUN", "177": "I-X", "178": "I-X+PUNCT", "179": "I-X+PUNCT+PUNCT", "180": "I-X+X", "181": "I-X+X+PRON", "182": "INTJ", "183": "NOUN", "184": "NOUN+AUX", "185": "NOUN+PART", "186": "NUM", "187": "PART", "188": "PRON", "189": "PRON+AUX", "190": "PRON+VERB", "191": "PROPN", "192": "PROPN+PART", "193": "PUNCT", "194": "PUNCT+PUNCT", "195": "PUNCT+PUNCT+PUNCT", "196": "PUNCT+SYM", "197": "SCONJ", "198": "SYM", "199": "SYM+PUNCT", "200": "SYM+SYM", "201": "VERB", "202": "VERB+ADP", "203": "VERB+PART", "204": "VERB+PRON", "205": "VERB+VERB", "206": "X", "207": "X+X" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "ADJ": 0, "ADP": 1, "ADP+DET": 2, "ADP+PRON": 3, "ADV": 4, "ADV+AUX": 5, "ADV+PART": 6, "AUX": 7, "AUX+PART": 8, "B-ADJ": 9, "B-ADJ+ADJ": 10, "B-ADJ+NOUN": 11, "B-ADJ+NOUN+NOUN": 12, "B-ADJ+PART": 13, "B-ADJ+PROPN": 14, "B-ADJ+PUNCT": 15, "B-ADP": 16, "B-ADP+ADJ": 17, "B-ADP+NOUN": 18, "B-ADP+PRON": 19, "B-ADV": 20, "B-ADV+AUX": 21, "B-ADV+PUNCT": 22, "B-AUX": 23, "B-AUX+ADV": 24, "B-AUX+PART": 25, "B-AUX+PART+VERB": 26, "B-AUX+VERB": 27, "B-CCONJ": 28, "B-DET": 29, "B-DET+AUX": 30, "B-DET+NOUN": 31, "B-INTJ": 32, "B-INTJ+PUNCT": 33, "B-NOUN": 34, "B-NOUN+ADJ": 35, "B-NOUN+ADP": 36, "B-NOUN+AUX": 37, "B-NOUN+NOUN": 38, "B-NOUN+NOUN+VERB": 39, "B-NOUN+PART": 40, "B-NOUN+PROPN": 41, "B-NOUN+PUNCT": 42, "B-NOUN+SCONJ": 43, "B-NOUN+VERB": 44, "B-NUM": 45, "B-PART": 46, "B-PRON": 47, "B-PRON+ADJ": 48, "B-PRON+ADV": 49, "B-PRON+AUX": 50, "B-PRON+NOUN": 51, "B-PRON+PART": 52, "B-PRON+PRON": 53, "B-PRON+VERB": 54, "B-PROPN": 55, "B-PROPN+ADP": 56, "B-PROPN+AUX": 57, "B-PROPN+PART": 58, "B-PROPN+PROPN": 59, "B-PROPN+PUNCT": 60, "B-PROPN+PUNCT+PUNCT": 61, "B-PROPN+VERB": 62, "B-PUNCT": 63, "B-PUNCT+PUNCT": 64, "B-PUNCT+PUNCT+PUNCT": 65, "B-PUNCT+SYM+PUNCT": 66, "B-SCONJ": 67, "B-SYM": 68, "B-VERB": 69, "B-VERB+ADJ": 70, "B-VERB+ADJ+CCONJ": 71, "B-VERB+ADP": 72, "B-VERB+ADV": 73, "B-VERB+ADV+PUNCT": 74, "B-VERB+AUX": 75, "B-VERB+CCONJ": 76, "B-VERB+DET": 77, "B-VERB+NOUN": 78, "B-VERB+NOUN+CCONJ": 79, "B-VERB+NOUN+NOUN": 80, "B-VERB+PART": 81, "B-VERB+PRON": 82, "B-VERB+PRON+ADP": 83, "B-VERB+PRON+ADV": 84, "B-VERB+PROPN": 85, "B-VERB+SCONJ": 86, "B-VERB+VERB": 87, "B-VERB+VERB+NOUN": 88, "B-X": 89, "B-X+PUNCT": 90, "B-X+PUNCT+PUNCT": 91, "B-X+X": 92, "B-X+X+PRON": 93, "CCONJ": 94, "DET": 95, "DET+NUM": 96, "I-ADJ": 97, "I-ADJ+ADJ": 98, "I-ADJ+NOUN": 99, "I-ADJ+NOUN+NOUN": 100, "I-ADJ+PART": 101, "I-ADJ+PROPN": 102, "I-ADJ+PUNCT": 103, "I-ADP": 104, "I-ADP+ADJ": 105, "I-ADP+NOUN": 106, "I-ADP+PRON": 107, "I-ADV": 108, "I-ADV+AUX": 109, "I-ADV+PUNCT": 110, "I-AUX": 111, "I-AUX+ADV": 112, "I-AUX+PART": 113, "I-AUX+PART+VERB": 114, "I-AUX+VERB": 115, "I-CCONJ": 116, "I-DET": 117, "I-DET+AUX": 118, "I-DET+NOUN": 119, "I-INTJ": 120, "I-INTJ+PUNCT": 121, "I-NOUN": 122, "I-NOUN+ADJ": 123, "I-NOUN+ADP": 124, "I-NOUN+AUX": 125, "I-NOUN+NOUN": 126, "I-NOUN+NOUN+VERB": 127, "I-NOUN+PART": 128, "I-NOUN+PROPN": 129, "I-NOUN+PUNCT": 130, "I-NOUN+SCONJ": 131, "I-NOUN+VERB": 132, "I-NUM": 133, "I-PART": 134, "I-PRON": 135, "I-PRON+ADJ": 136, "I-PRON+ADV": 137, "I-PRON+AUX": 138, "I-PRON+NOUN": 139, "I-PRON+PART": 140, "I-PRON+PRON": 141, "I-PRON+VERB": 142, "I-PROPN": 143, "I-PROPN+ADP": 144, "I-PROPN+AUX": 145, "I-PROPN+PART": 146, "I-PROPN+PROPN": 147, "I-PROPN+PUNCT": 148, "I-PROPN+PUNCT+PUNCT": 149, "I-PROPN+VERB": 150, "I-PUNCT": 151, "I-PUNCT+PUNCT": 152, "I-PUNCT+PUNCT+PUNCT": 153, "I-PUNCT+SYM+PUNCT": 154, "I-SCONJ": 155, "I-SYM": 156, "I-VERB": 157, "I-VERB+ADJ": 158, "I-VERB+ADJ+CCONJ": 159, "I-VERB+ADP": 160, "I-VERB+ADV": 161, "I-VERB+ADV+PUNCT": 162, "I-VERB+AUX": 163, "I-VERB+CCONJ": 164, "I-VERB+DET": 165, "I-VERB+NOUN": 166, "I-VERB+NOUN+CCONJ": 167, "I-VERB+NOUN+NOUN": 168, "I-VERB+PART": 169, "I-VERB+PRON": 170, "I-VERB+PRON+ADP": 171, "I-VERB+PRON+ADV": 172, "I-VERB+PROPN": 173, "I-VERB+SCONJ": 174, "I-VERB+VERB": 175, "I-VERB+VERB+NOUN": 176, "I-X": 177, "I-X+PUNCT": 178, "I-X+PUNCT+PUNCT": 179, "I-X+X": 180, "I-X+X+PRON": 181, "INTJ": 182, "NOUN": 183, "NOUN+AUX": 184, "NOUN+PART": 185, "NUM": 186, "PART": 187, "PRON": 188, "PRON+AUX": 189, "PRON+VERB": 190, "PROPN": 191, "PROPN+PART": 192, "PUNCT": 193, "PUNCT+PUNCT": 194, "PUNCT+PUNCT+PUNCT": 195, "PUNCT+SYM": 196, "SCONJ": 197, "SYM": 198, "SYM+PUNCT": 199, "SYM+SYM": 200, "VERB": 201, "VERB+ADP": 202, "VERB+PART": 203, "VERB+PRON": 204, "VERB+VERB": 205, "X": 206, "X+X": 207 }, "layer_norm_eps": 1e-05, "max_position_embeddings": 514, "model_type": "roberta", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 1, "position_embedding_type": "absolute", "task_specific_params": { "upos_multiword": { "ADJ+ADJ": { "bigenough": [ "big", "enough" ], "interestingsocial": [ "interesting", "social" ], "longeight-inch": [ "long", "eight-inch" ], "pressingsocial": [ "pressing", "social" ] }, "ADJ+NOUN": { "bigsource": [ "big", "source" ], "contrastingseries": [ "contrasting", "series" ], "distractingelements": [ "distracting", "elements" ], "fascinatingshop": [ "fascinating", "shop" ], "gruelingsanctions": [ "grueling", "sanctions" ], "increasingsafety": [ "increasing", "safety" ], "longexposures": [ "long", "exposures" ], "longhair": [ "long", "hair" ], "longhistory": [ "long", "history" ], "ongoingsummaries": [ "ongoing", "summaries" ], "pre-meetingsite": [ "pre-meeting", "site" ], "rallyingsigns": [ "rallying", "signs" ], "revenue-raisingservices": [ "revenue-raising", "services" ], "self-questioningshrug": [ "self-questioning", "shrug" ], "simperingsmile": [ "simpering", "smile" ], "stronghints": [ "strong", "hints" ], "wizardingsport": [ "wizarding", "sport" ] }, "ADJ+PART": { "elses": [ "else", "s" ] }, "ADJ+PROPN": { "Nationwidetints": [ "Nationwide", "tints" ] }, "ADJ+PUNCT": { "Jr..": [ "Jr.", "." ], "e.g.:": [ "e.g.", ":" ], "i.e.,": [ "i.e.", "," ] }, "ADP+DET": { "des": [ "de", "les" ] }, "ADP+NOUN": { "Infact": [ "In", "fact" ], "overtime": [ "over", "time" ] }, "ADP+PRON": { "init": [ "in", "it" ] }, "ADV+AUX": { "Heres": [ "Here", "s" ], "longhave": [ "long", "have" ] }, "ADV+PART": { "into": [ "in", "to" ] }, "ADV+PUNCT": { "E.g.,": [ "E.g.", "," ], "e.g.,": [ "e.g.", "," ], "i.e.,": [ "i.e.", "," ], "i.e.:": [ "i.e.", ":" ] }, "AUX+ADV": { "cannot": [ "can", "not" ] }, "AUX+PART": { "Aren't": [ "Are", "n't" ], "Aren\u2019t": [ "Are", "n\u2019t" ], "CANT": [ "CA", "NT" ], "Can't": [ "Ca", "n't" ], "Cannot": [ "Can", "not" ], "Can\u2019t": [ "Ca", "n\u2019t" ], "DON'T": [ "DO", "N'T" ], "DONT": [ "DO", "NT" ], "Don't": [ "Do", "n't" ], "Dont": [ "Do", "nt" ], "Don\u2019t": [ "Do", "n\u2019t" ], "Haven't": [ "Have", "n't" ], "Isn't": [ "Is", "n't" ], "Isn\u2019t": [ "Is", "n\u2019t" ], "Won't": [ "Wo", "n't" ], "ain't": [ "ai", "n't" ], "aint": [ "ai", "nt" ], "aren't": [ "are", "not" ], "arent": [ "are", "nt" ], "aren\u2019t": [ "are", "n\u2019t" ], "can't": [ "can", "not" ], "cannot": [ "can", "not" ], "cant": [ "ca", "nt" ], "can\u2019t": [ "ca", "n\u2019t" ], "didn't": [ "did", "n't" ], "didn\u2019t": [ "did", "n\u2019t" ], "doesn't": [ "does", "n't" ], "doesn\u2019t": [ "does", "n\u2019t" ], "don't": [ "do", "not" ], "dont": [ "do", "nt" ], "don\u2019t": [ "do", "n\u2019t" ], "haven't": [ "have", "n't" ], "shan't": [ "sha", "n't" ], "shouldn't": [ "should", "not" ], "wasent": [ "wase", "nt" ], "weren't": [ "were", "n't" ], "weren\u2019t": [ "were", "n\u2019t" ], "won't": [ "will", "not" ], "wont": [ "wo", "nt" ], "won\u2019t": [ "wo", "n\u2019t" ] }, "AUX+PART+VERB": { "dunno": [ "du", "n", "no" ] }, "AUX+VERB": { "beingsaid": [ "being", "said" ], "beingsent": [ "being", "sent" ], "beingshipped": [ "being", "shipped" ], "beingspoken": [ "being", "spoken" ], "havingsaid": [ "having", "said" ] }, "DET+AUX": { "thes": [ "the", "s" ] }, "DET+NOUN": { "ALOT": [ "A", "LOT" ], "Alot": [ "A", "lot" ], "apart": [ "a", "part" ], "awhile": [ "a", "while" ], "sometime": [ "some", "time" ] }, "DET+NUM": { "everyone": [ "every", "one" ] }, "INTJ+PUNCT": { "etc.'": [ "etc.", "'" ], "ta',": [ "ta'", "," ] }, "NOUN+ADJ": { "nothingspecial": [ "nothing", "special" ] }, "NOUN+ADP": { "flagon": [ "flag", "on" ], "groundsof": [ "grounds", "of" ], "hashtagon": [ "hashtag", "on" ], "meetingsince": [ "meeting", "since" ] }, "NOUN+AUX": { "breathingshould": [ "breathing", "should" ], "doghas": [ "dog", "has" ], "mythmakingshould": [ "mythmaking", "should" ] }, "NOUN+NOUN": { "Drivingschool": [ "Driving", "school" ], "bakingsheet": [ "baking", "sheet" ], "bakingsoda": [ "baking", "soda" ], "counselingservices": [ "counseling", "services" ], "datingservice": [ "dating", "service" ], "doghouse": [ "dog", "house" ], "drivingschool": [ "driving", "school" ], "engineeringservices": [ "engineering", "services" ], "eveningschedule": [ "evening", "schedule" ], "kingsnake": [ "king", "snake" ], "kingsnakes": [ "king", "snakes" ], "lightingshowroom": [ "lighting", "showroom" ], "lightingsources": [ "lighting", "sources" ], "loggingsites": [ "logging", "sites" ], "mpgnumber": [ "mpg", "number" ], "plughole": [ "plug", "hole" ], "runningshorts": [ "running", "shorts" ], "tagsets": [ "tag", "sets" ], "testingschedule": [ "testing", "schedule" ], "towingservices": [ "towing", "services" ], "trainingsession": [ "training", "session" ], "writingschedule": [ "writing", "schedule" ], "writingsystem": [ "writing", "system" ] }, "NOUN+NOUN+VERB": { "RecruitingMeetingscheduled": [ "Recruiting", "Meeting", "scheduled" ] }, "NOUN+PART": { "DAUGHTERS": [ "DAUGHTER", "S" ], "Kids": [ "Kid", "s" ], "Mares": [ "Mare", "s" ], "Smokers": [ "Smoker", "s" ], "Travelers": [ "Traveler", "s" ], "animals": [ "animal", "s" ], "bachelors": [ "bachelor", "s" ], "bakers": [ "baker", "s" ], "beginners": [ "beginner", "s" ], "bettas": [ "betta", "s" ], "boys": [ "boy", "s" ], "cars": [ "car", "s" ], "cats": [ "cat", "s" ], "cycles": [ "cycle", "s" ], "dads": [ "dad", "s" ], "doctors": [ "doctor", "s" ], "dogs": [ "dog", "s" ], "drivers": [ "driver", "s" ], "friends": [ "friend", "s" ], "grandmas": [ "grandma", "s" ], "horses": [ "horse", "s" ], "humans": [ "human", "s" ], "males": [ "male", "s" ], "manufacturers": [ "manufacturer", "s" ], "mares": [ "mare", "s" ], "nights": [ "night", "s" ], "owners": [ "owner", "s" ], "peoples": [ "people", "s" ], "persons": [ "person", "s" ], "scammers": [ "scammer", "s" ], "sons": [ "son", "s" ], "teams": [ "team", "s" ], "todays": [ "today", "s" ], "trainers": [ "trainer", "s" ], "visitors": [ "visitor", "s" ], "wits": [ "wit", "s" ], "workers": [ "worker", "s" ], "years": [ "year", "s" ] }, "NOUN+PUNCT": { "Ed.:": [ "Ed.", ":" ], "Fax.(": [ "Fax.", "(" ], "a.m.,": [ "a.m.", "," ], "lb.,": [ "lb.", "," ], "mins.,": [ "mins.", "," ], "oz.,": [ "oz.", "," ], "p.m.,": [ "p.m.", "," ] }, "NOUN+SCONJ": { "buildingsince": [ "building", "since" ] }, "NOUN+VERB": { "dogeat": [ "dog", "eat" ], "morningserves": [ "morning", "serves" ], "thingsounded": [ "thing", "sounded" ] }, "PRON+ADJ": { "everythingset": [ "everything", "set" ], "somethingsuch": [ "something", "such" ] }, "PRON+ADV": { "somethingsometime": [ "something", "sometime" ] }, "PRON+AUX": { "ITS": [ "IT", "S" ], "Im": [ "I", "m" ], "Its": [ "It", "s" ], "Whats": [ "What", "s" ], "Your": [ "You", "r" ], "hes": [ "he", "s" ], "id": [ "i", "d" ], "im": [ "i", "m" ], "its": [ "it", "s" ], "iv": [ "i", "v" ], "ive": [ "i", "ve" ], "thats": [ "that", "s" ], "their": [ "thei", "r" ], "there": [ "the", "re" ], "ur": [ "u", "r" ], "your": [ "you", "r" ] }, "PRON+NOUN": { "alleconomy": [ "all", "economy" ] }, "PRON+PART": { "anyones": [ "anyone", "s" ] }, "PRON+PRON": { "everythingshe": [ "everything", "she" ] }, "PRON+VERB": { "Thats": [ "That", "s" ], "Theres": [ "There", "s" ], "everythingset": [ "everything", "set" ], "iguz": [ "i", "guz" ], "im": [ "i", "m" ], "its": [ "it", "s" ], "theres": [ "there", "s" ], "youthank": [ "you", "thank" ] }, "PROPN+ADP": { "Pagin": [ "Pag", "in" ], "Petersburgin": [ "Petersburg", "in" ] }, "PROPN+AUX": { "Hedwighad": [ "Hedwig", "had" ] }, "PROPN+PART": { "BJs": [ "BJ", "s" ], "Chilis": [ "Chili", "s" ], "Friscos": [ "Frisco", "s" ], "Hams": [ "Ham", "s" ], "Kobeys": [ "Kobey", "s" ], "LWs": [ "LW", "s" ], "Leonardos": [ "Leonardo", "s" ], "Mortons": [ "Morton", "s" ], "Travellers": [ "Traveller", "s" ], "Valentines": [ "Valentine", "s" ], "Years": [ "Year", "s" ], "jacks": [ "jack", "s" ] }, "PROPN+PROPN": { "G&GAutomotive": [ "G&G", "Automotive" ], "drivingschool": [ "driving", "school" ] }, "PROPN+PUNCT": { "B.,": [ "B.", "," ], "B.A.\"": [ "B.A.", "\"" ], "D.C.,": [ "D.C.", "," ], "Inc.\"": [ "Inc.", "\"" ], "M.,": [ "M.", "," ], "N.O.?": [ "N.O.", "?" ], "Que.,": [ "Que.", "," ], "U.N.,": [ "U.N.", "," ], "U.S.)": [ "U.S.", ")" ], "U.S.-": [ "U.S.", "-" ], "Va.-": [ "Va.", "-" ] }, "PROPN+PUNCT+PUNCT": { "W.H.\",": [ "W.H.", "\"", "," ] }, "PROPN+VERB": { "Orglive": [ "Org", "live" ], "Pagyelped": [ "Pag", "yelped" ] }, "PUNCT+PUNCT": { "!\"": [ "!", "\"" ], "!'": [ "!", "'" ], "!)": [ "!", ")" ], "\"!": [ "\"", "!" ], "\"\"": [ "\"", "\"" ], "\"(": [ "\"", "(" ], "\")": [ "\"", ")" ], "\",": [ "\"", "," ], "\"-": [ "\"", "-" ], "\".": [ "\"", "." ], "\"...": [ "\"", "..." ], "\":": [ "\"", ":" ], "\"[": [ "\"", "[" ], "')": [ "'", ")" ], "',": [ "'", "," ], "(\"": [ "(", "\"" ], "(\"\"": [ "(", "\"\"" ], "('": [ "(", "'" ], "((": [ "(", "(" ], "([": [ "(", "[" ], ")\"": [ ")", "\"" ], ")(": [ ")", "(" ], "))": [ ")", ")" ], "),": [ ")", "," ], ").": [ ")", "." ], ")...": [ ")", "..." ], "):": [ ")", ":" ], ");": [ ")", ";" ], "*,": [ "*", "," ], ",\"": [ ",", "\"" ], ",'": [ ",", "'" ], ",''": [ ",", "''" ], ",...": [ ",", "..." ], "-\"": [ "-", "\"" ], ".\"": [ ".", "\"" ], ".'": [ ".", "'" ], "..": [ ".", "." ], "...\"": [ "...", "\"" ], "....": [ "...", "." ], "?\"": [ "?", "\"" ], "?'": [ "?", "'" ], "?)": [ "?", ")" ], "?]": [ "?", "]" ], "],": [ "]", "," ], "];": [ "]", ";" ] }, "PUNCT+PUNCT+PUNCT": { "!),": [ "!", ")", "," ], "\"),": [ "\"", ")", "," ], "?),": [ "?", ")", "," ], "]),": [ "]", ")", "," ] }, "PUNCT+SYM": { "($": [ "(", "$" ] }, "PUNCT+SYM+PUNCT": { "(%)": [ "(", "%", ")" ] }, "SYM+PUNCT": { "$,": [ "$", "," ], "%)": [ "%", ")" ], "%,": [ "%", "," ], "-'": [ "-", "'" ] }, "SYM+SYM": { "-$": [ "-", "$" ] }, "VERB+ADJ": { "alteringspecific": [ "altering", "specific" ], "doingshoddy": [ "doing", "shoddy" ], "facingserious": [ "facing", "serious" ], "legalizingsame": [ "legalizing", "same" ], "mixinguppercase": [ "mixing", "uppercase" ], "motivatingsyntactic": [ "motivating", "syntactic" ], "outsourcingspecial": [ "outsourcing", "special" ], "reinforcingsimilar": [ "reinforcing", "similar" ], "showingsuperb": [ "showing", "superb" ], "usingsimple": [ "using", "simple" ] }, "VERB+ADJ+CCONJ": { "lookingsmugand": [ "looking", "smug", "and" ] }, "VERB+ADP": { "Login": [ "Log", "in" ], "gamingsince": [ "gaming", "since" ], "goto": [ "go", "to" ], "hummingsince": [ "humming", "since" ], "investigatingsince": [ "investigating", "since" ], "login": [ "log", "in" ], "setup": [ "set", "up" ] }, "VERB+ADV": { "advancingslowly": [ "advancing", "slowly" ], "behavingsplendidly": [ "behaving", "splendidly" ], "bucklingslightly": [ "buckling", "slightly" ], "contributingsubstantially": [ "contributing", "substantially" ], "exultingeverywhere": [ "exulting", "everywhere" ], "includingspecifically": [ "including", "specifically" ], "movingsouthward": [ "moving", "southward" ], "proposingspecifically": [ "proposing", "specifically" ], "scavengingseriously": [ "scavenging", "seriously" ], "swellingslightly": [ "swelling", "slightly" ], "totalingsomewhere": [ "totaling", "somewhere" ], "walkinguptown": [ "walking", "uptown" ] }, "VERB+ADV+PUNCT": { "studyinge.g.,": [ "studying", "e.g.", "," ] }, "VERB+AUX": { "Winningshall": [ "Winning", "shall" ], "copyingshould": [ "copying", "should" ] }, "VERB+CCONJ": { "departingeither": [ "departing", "either" ] }, "VERB+DET": { "basingsome": [ "basing", "some" ], "demonstratingsuch": [ "demonstrating", "such" ], "discussingsome": [ "discussing", "some" ], "doingevery": [ "doing", "every" ], "doingsome": [ "doing", "some" ], "dumpingsome": [ "dumping", "some" ], "experiencingsome": [ "experiencing", "some" ], "finishingsome": [ "finishing", "some" ], "hostingsome": [ "hosting", "some" ], "meetingeach": [ "meeting", "each" ], "playingsome": [ "playing", "some" ], "rangeach": [ "rang", "each" ], "readingsome": [ "reading", "some" ], "regardingsome": [ "regarding", "some" ], "replacingsome": [ "replacing", "some" ], "spendingsome": [ "spending", "some" ], "usingsome": [ "using", "some" ] }, "VERB+NOUN": { "continuingsource": [ "continuing", "source" ], "differingschedules": [ "differing", "schedules" ], "doingscissors": [ "doing", "scissors" ], "expandingsystem": [ "expanding", "system" ], "expressingsadness": [ "expressing", "sadness" ], "followingsuggestion": [ "following", "suggestion" ], "formingeggs": [ "forming", "eggs" ], "gettingsavage": [ "getting", "savage" ], "gleamingsand": [ "gleaming", "sand" ], "improvingsurveillance": [ "improving", "surveillance" ], "meaningshell": [ "meaning", "shell" ], "playingsports": [ "playing", "sports" ], "printingerrors": [ "printing", "errors" ], "producingshrubs": [ "producing", "shrubs" ], "providingservices": [ "providing", "services" ], "quittingsmoking": [ "quitting", "smoking" ], "rushingslipstream": [ "rushing", "slipstream" ], "seeingsomeone": [ "seeing", "someone" ], "studyingsymmetry": [ "studying", "symmetry" ] }, "VERB+PART": { "Gonna": [ "Gon", "na" ], "Gotta": [ "Got", "ta" ], "aren't": [ "are", "n't" ], "didn't": [ "did", "n't" ], "doesn't": [ "does", "n't" ], "don't": [ "do", "n't" ], "don\u2019t": [ "do", "n\u2019t" ], "gonna": [ "gon", "na" ], "gotta": [ "got", "ta" ], "haven't": [ "have", "n't" ], "wana": [ "wan", "a" ], "wanna": [ "wan", "na" ] }, "VERB+PRON": { "Lets": [ "Let", "s" ], "callyou": [ "call", "you" ], "crossingeach": [ "crossing", "each" ], "doingeverything": [ "doing", "everything" ], "expectingsomeone": [ "expecting", "someone" ], "lets": [ "let", "s" ], "slunghis": [ "slung", "his" ] }, "VERB+PRON+ADP": { "seeingeverythingaround": [ "seeing", "everything", "around" ] }, "VERB+PRON+ADV": { "screwingeverythingup": [ "screwing", "everything", "up" ] }, "VERB+PROPN": { "arrivingsalt": [ "arriving", "salt" ], "departingsan": [ "departing", "san" ], "leavingsan": [ "leaving", "san" ], "leavingsunday": [ "leaving", "sunday" ] }, "VERB+SCONJ": { "decidewhether": [ "decide", "whether" ] }, "VERB+VERB": { "growingsuspended": [ "growing", "suspended" ], "had": [ "h", "ad" ] }, "VERB+VERB+NOUN": { "crushingsleepingflowers": [ "crushing", "sleeping", "flowers" ], "hostingvisitingschool": [ "hosting", "visiting", "school" ] }, "X+PUNCT": { "al.,": [ "al.", "," ], "e.g.,": [ "e.g.", "," ], "etc.)": [ "etc.", ")" ], "etc.,": [ "etc.", "," ], "etc..": [ "etc.", "." ] }, "X+X": { "'s": [ "'", "s" ], ").doc": [ ")", ".doc" ] }, "X+X+PRON": { "http://i.imgur.com/T2zff.jpghttp://i.imgur.com/Xytex.jpgI": [ "http://i.imgur.com/T2zff.jpg", "http://i.imgur.com/Xytex.jpg", "I" ] } } }, "tokenizer_class": "RobertaTokenizerFast", "torch_dtype": "float32", "transformers_version": "4.11.3", "type_vocab_size": 1, "use_cache": true, "vocab_size": 50265 }