{
"architectures": [
"XLMRobertaForTokenClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"eos_token_id": 2,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "ADJ",
"1": "ADJ+PART",
"2": "ADP",
"3": "ADV",
"4": "ADV+PART",
"5": "AUX",
"6": "AUX+PART",
"7": "B-ADJ",
"8": "B-ADJ+PART",
"9": "B-ADP",
"10": "B-ADP+ADP",
"11": "B-ADV",
"12": "B-AUX",
"13": "B-AUX+PART",
"14": "B-AUX+PART+VERB",
"15": "B-CCONJ",
"16": "B-DET",
"17": "B-INTJ",
"18": "B-NOUN",
"19": "B-NOUN+PART",
"20": "B-NUM",
"21": "B-PART",
"22": "B-PRON",
"23": "B-PRON+AUX",
"24": "B-PROPN",
"25": "B-PROPN+PART",
"26": "B-PUNCT",
"27": "B-SCONJ",
"28": "B-SYM",
"29": "B-VERB",
"30": "B-VERB+ADV",
"31": "B-VERB+PART",
"32": "B-X",
"33": "CCONJ",
"34": "DET",
"35": "I-ADJ",
"36": "I-ADJ+PART",
"37": "I-ADP",
"38": "I-ADP+ADP",
"39": "I-ADV",
"40": "I-AUX",
"41": "I-AUX+PART",
"42": "I-AUX+PART+VERB",
"43": "I-CCONJ",
"44": "I-DET",
"45": "I-INTJ",
"46": "I-NOUN",
"47": "I-NOUN+PART",
"48": "I-NUM",
"49": "I-PART",
"50": "I-PRON",
"51": "I-PRON+AUX",
"52": "I-PROPN",
"53": "I-PROPN+PART",
"54": "I-PUNCT",
"55": "I-SCONJ",
"56": "I-SYM",
"57": "I-VERB",
"58": "I-VERB+ADV",
"59": "I-VERB+PART",
"60": "I-X",
"61": "INTJ",
"62": "NOUN",
"63": "NOUN+ADP",
"64": "NOUN+PART",
"65": "NUM",
"66": "PART",
"67": "PRON",
"68": "PRON+AUX",
"69": "PRON+VERB",
"70": "PROPN",
"71": "PUNCT",
"72": "SCONJ",
"73": "SYM",
"74": "VERB",
"75": "VERB+PART",
"76": "X"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"ADJ": 0,
"ADJ+PART": 1,
"ADP": 2,
"ADV": 3,
"ADV+PART": 4,
"AUX": 5,
"AUX+PART": 6,
"B-ADJ": 7,
"B-ADJ+PART": 8,
"B-ADP": 9,
"B-ADP+ADP": 10,
"B-ADV": 11,
"B-AUX": 12,
"B-AUX+PART": 13,
"B-AUX+PART+VERB": 14,
"B-CCONJ": 15,
"B-DET": 16,
"B-INTJ": 17,
"B-NOUN": 18,
"B-NOUN+PART": 19,
"B-NUM": 20,
"B-PART": 21,
"B-PRON": 22,
"B-PRON+AUX": 23,
"B-PROPN": 24,
"B-PROPN+PART": 25,
"B-PUNCT": 26,
"B-SCONJ": 27,
"B-SYM": 28,
"B-VERB": 29,
"B-VERB+ADV": 30,
"B-VERB+PART": 31,
"B-X": 32,
"CCONJ": 33,
"DET": 34,
"I-ADJ": 35,
"I-ADJ+PART": 36,
"I-ADP": 37,
"I-ADP+ADP": 38,
"I-ADV": 39,
"I-AUX": 40,
"I-AUX+PART": 41,
"I-AUX+PART+VERB": 42,
"I-CCONJ": 43,
"I-DET": 44,
"I-INTJ": 45,
"I-NOUN": 46,
"I-NOUN+PART": 47,
"I-NUM": 48,
"I-PART": 49,
"I-PRON": 50,
"I-PRON+AUX": 51,
"I-PROPN": 52,
"I-PROPN+PART": 53,
"I-PUNCT": 54,
"I-SCONJ": 55,
"I-SYM": 56,
"I-VERB": 57,
"I-VERB+ADV": 58,
"I-VERB+PART": 59,
"I-X": 60,
"INTJ": 61,
"NOUN": 62,
"NOUN+ADP": 63,
"NOUN+PART": 64,
"NUM": 65,
"PART": 66,
"PRON": 67,
"PRON+AUX": 68,
"PRON+VERB": 69,
"PROPN": 70,
"PUNCT": 71,
"SCONJ": 72,
"SYM": 73,
"VERB": 74,
"VERB+PART": 75,
"X": 76
},
"layer_norm_eps": 1e-05,
"max_position_embeddings": 514,
"model_type": "xlm-roberta",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"output_past": true,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"task_specific_params": {
"upos_multiword": {
"ADJ+PART": {
"elses": [
"else",
"s"
],
"others": [
"other",
"s"
]
},
"ADP+ADP": {
"OUTTA": [
"OUT",
"TA"
]
},
"ADV+PART": {
"into": [
"in",
"to"
]
},
"AUX+PART": {
"Aren't": [
"Are",
"n't"
],
"CANNOT": [
"CAN",
"NOT"
],
"CANT": [
"CA",
"NT"
],
"Can't": [
"Ca",
"n't"
],
"DON'T": [
"DO",
"N'T"
],
"Don't": [
"Do",
"n't"
],
"Dont": [
"Do",
"nt"
],
"WASN'T": [
"WAS",
"N'T"
],
"ain't": [
"ai",
"n't"
],
"aint": [
"ai",
"nt"
],
"aren't": [
"are",
"n't"
],
"arent": [
"are",
"nt"
],
"can't": [
"ca",
"n't"
],
"cannot": [
"can",
"not"
],
"cant": [
"ca",
"nt"
],
"can\u2019t": [
"ca",
"n\u2019t"
],
"couldn't": [
"could",
"n't"
],
"couldnt": [
"could",
"nt"
],
"didn't": [
"did",
"n't"
],
"didnt": [
"did",
"nt"
],
"didn\u2019t": [
"did",
"n\u2019t"
],
"doesn't": [
"does",
"n't"
],
"doesnt": [
"does",
"nt"
],
"don't": [
"do",
"n't"
],
"dont": [
"do",
"nt"
],
"don\u2019t": [
"do",
"n\u2019t"
],
"haven't": [
"have",
"n't"
],
"havn't": [
"hav",
"n't"
],
"isn't": [
"is",
"n't"
],
"wasent": [
"wase",
"nt"
],
"wasn't": [
"was",
"n't"
],
"won't": [
"wo",
"n't"
],
"wont": [
"wo",
"nt"
],
"won\u2019t": [
"wo",
"n\u2019t"
],
"wouldn't": [
"would",
"n't"
],
"wouldnt": [
"would",
"nt"
]
},
"AUX+PART+VERB": {
"dunno": [
"du",
"n",
"no"
]
},
"NOUN+ADP": {
"sorta": [
"sort",
"a"
]
},
"NOUN+PART": {
"DAUGHTERS": [
"DAUGHTER",
"S"
],
"Kids": [
"Kid",
"s"
],
"Smokers": [
"Smoker",
"s"
],
"Travelers": [
"Traveler",
"s"
],
"animals": [
"animal",
"s"
],
"bakers": [
"baker",
"s"
],
"beginners": [
"beginner",
"s"
],
"bettas": [
"betta",
"s"
],
"boys": [
"boy",
"s"
],
"friends": [
"friend",
"s"
],
"grandmas": [
"grandma",
"s"
],
"humans": [
"human",
"s"
],
"manufacturers": [
"manufacturer",
"s"
],
"owners": [
"owner",
"s"
],
"scammers": [
"scammer",
"s"
],
"teams": [
"team",
"s"
],
"visitors": [
"visitor",
"s"
],
"workers": [
"worker",
"s"
]
},
"PRON+AUX": {
"ITS": [
"IT",
"S"
],
"Im": [
"I",
"m"
],
"Your": [
"You",
"r"
],
"id": [
"i",
"d"
],
"im": [
"i",
"m"
],
"its": [
"it",
"s"
],
"their": [
"thei",
"r"
],
"there": [
"the",
"re"
],
"ur": [
"u",
"r"
],
"your": [
"you",
"r"
],
"youre": [
"you",
"re"
]
},
"PRON+VERB": {
"im": [
"i",
"m"
],
"its": [
"it",
"s"
]
},
"PROPN+PART": {
"Friscos": [
"Frisco",
"s"
],
"Mortons": [
"Morton",
"s"
]
},
"VERB+ADV": {
"c'mon": [
"c'm",
"on"
]
},
"VERB+PART": {
"Gotta": [
"Got",
"ta"
],
"aren't": [
"are",
"n't"
],
"doesn't": [
"does",
"n't"
],
"doesnt": [
"does",
"nt"
],
"don't": [
"do",
"n't"
],
"gonna": [
"gon",
"na"
],
"gotta": [
"got",
"ta"
],
"isn't": [
"is",
"n't"
],
"wana": [
"wan",
"a"
],
"wasn't": [
"was",
"n't"
]
}
}
},
"tokenizer_class": "XLMRobertaTokenizerFast",
"torch_dtype": "float32",
"transformers_version": "4.11.3",
"type_vocab_size": 1,
"use_cache": true,
"vocab_size": 250002
}