{
"add_cross_attention": false,
"architectures": [
"XLMRobertaForTokenClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"dtype": "float32",
"eos_token_id": 2,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "O",
"1": "B-EN",
"2": "I-EN",
"3": "B-ES",
"4": "I-ES",
"5": "B-FR",
"6": "I-FR",
"7": "B-DE",
"8": "I-DE",
"9": "B-IT",
"10": "I-IT",
"11": "B-PT",
"12": "I-PT",
"13": "B-NL",
"14": "I-NL",
"15": "B-VI",
"16": "I-VI",
"17": "B-TR",
"18": "I-TR",
"19": "B-LA",
"20": "I-LA",
"21": "B-ID",
"22": "I-ID",
"23": "B-MS",
"24": "I-MS",
"25": "B-AF",
"26": "I-AF",
"27": "B-SQ",
"28": "I-SQ",
"29": "B-IS",
"30": "I-IS",
"31": "B-NO",
"32": "I-NO",
"33": "B-SV",
"34": "I-SV",
"35": "B-DA",
"36": "I-DA",
"37": "B-FI",
"38": "I-FI",
"39": "B-HU",
"40": "I-HU",
"41": "B-PL",
"42": "I-PL",
"43": "B-CS",
"44": "I-CS",
"45": "B-RO",
"46": "I-RO",
"47": "B-RU",
"48": "I-RU",
"49": "B-BG",
"50": "I-BG",
"51": "B-UK",
"52": "I-UK",
"53": "B-SR",
"54": "I-SR",
"55": "B-BE",
"56": "I-BE",
"57": "B-KK",
"58": "I-KK",
"59": "B-MK",
"60": "I-MK",
"61": "B-MN",
"62": "I-MN",
"63": "B-ZH",
"64": "I-ZH",
"65": "B-JA",
"66": "I-JA",
"67": "B-KO",
"68": "I-KO",
"69": "B-HI",
"70": "I-HI",
"71": "B-UR",
"72": "I-UR",
"73": "B-BN",
"74": "I-BN",
"75": "B-TA",
"76": "I-TA",
"77": "B-TE",
"78": "I-TE",
"79": "B-MR",
"80": "I-MR",
"81": "B-GU",
"82": "I-GU",
"83": "B-KN",
"84": "I-KN",
"85": "B-ML",
"86": "I-ML",
"87": "B-PA",
"88": "I-PA",
"89": "B-AS",
"90": "I-AS",
"91": "B-OR",
"92": "I-OR",
"93": "B-AR",
"94": "I-AR",
"95": "B-FA",
"96": "I-FA",
"97": "B-PS",
"98": "I-PS",
"99": "B-SD",
"100": "I-SD",
"101": "B-UG",
"102": "I-UG",
"103": "B-EL",
"104": "I-EL",
"105": "B-HE",
"106": "I-HE",
"107": "B-HY",
"108": "I-HY",
"109": "B-KA",
"110": "I-KA",
"111": "B-AM",
"112": "I-AM",
"113": "B-KM",
"114": "I-KM",
"115": "B-LO",
"116": "I-LO",
"117": "B-MY",
"118": "I-MY",
"119": "B-TH",
"120": "I-TH",
"121": "B-SI",
"122": "I-SI",
"123": "B-BO",
"124": "I-BO",
"125": "B-DV",
"126": "I-DV",
"127": "B-TI",
"128": "I-TI",
"129": "B-SW",
"130": "I-SW",
"131": "B-EU",
"132": "I-EU",
"133": "B-TL",
"134": "I-TL",
"135": "B-CA",
"136": "I-CA",
"137": "B-GL",
"138": "I-GL",
"139": "B-OC",
"140": "I-OC",
"141": "B-BR",
"142": "I-BR",
"143": "B-GA",
"144": "I-GA",
"145": "B-GD",
"146": "I-GD",
"147": "B-CY",
"148": "I-CY",
"149": "B-BS",
"150": "I-BS",
"151": "B-HR",
"152": "I-HR",
"153": "B-SL",
"154": "I-SL",
"155": "B-SK",
"156": "I-SK",
"157": "B-ET",
"158": "I-ET",
"159": "B-LV",
"160": "I-LV",
"161": "B-LT",
"162": "I-LT",
"163": "B-EO",
"164": "I-EO",
"165": "B-JV",
"166": "I-JV",
"167": "B-MG",
"168": "I-MG",
"169": "B-OM",
"170": "I-OM",
"171": "B-SO",
"172": "I-SO",
"173": "B-SU",
"174": "I-SU",
"175": "B-UZ",
"176": "I-UZ",
"177": "B-KU",
"178": "I-KU",
"179": "B-CKB",
"180": "I-CKB",
"181": "B-HBO",
"182": "I-HBO",
"183": "B-GRC",
"184": "I-GRC",
"185": "B-NE",
"186": "I-NE",
"187": "B-MT",
"188": "I-MT",
"189": "B-LB",
"190": "I-LB",
"191": "B-RM",
"192": "I-RM",
"193": "B-TT",
"194": "I-TT",
"195": "B-KY",
"196": "I-KY",
"197": "B-TG",
"198": "I-TG",
"199": "B-BA",
"200": "I-BA",
"201": "B-YO",
"202": "I-YO",
"203": "B-ZU",
"204": "I-ZU",
"205": "B-NY",
"206": "I-NY",
"207": "B-CE",
"208": "I-CE"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"is_decoder": false,
"label2id": {
"B-AF": 25,
"B-AM": 111,
"B-AR": 93,
"B-AS": 89,
"B-BA": 199,
"B-BE": 55,
"B-BG": 49,
"B-BN": 73,
"B-BO": 123,
"B-BR": 141,
"B-BS": 149,
"B-CA": 135,
"B-CE": 207,
"B-CKB": 179,
"B-CS": 43,
"B-CY": 147,
"B-DA": 35,
"B-DE": 7,
"B-DV": 125,
"B-EL": 103,
"B-EN": 1,
"B-EO": 163,
"B-ES": 3,
"B-ET": 157,
"B-EU": 131,
"B-FA": 95,
"B-FI": 37,
"B-FR": 5,
"B-GA": 143,
"B-GD": 145,
"B-GL": 137,
"B-GRC": 183,
"B-GU": 81,
"B-HBO": 181,
"B-HE": 105,
"B-HI": 69,
"B-HR": 151,
"B-HU": 39,
"B-HY": 107,
"B-ID": 21,
"B-IS": 29,
"B-IT": 9,
"B-JA": 65,
"B-JV": 165,
"B-KA": 109,
"B-KK": 57,
"B-KM": 113,
"B-KN": 83,
"B-KO": 67,
"B-KU": 177,
"B-KY": 195,
"B-LA": 19,
"B-LB": 189,
"B-LO": 115,
"B-LT": 161,
"B-LV": 159,
"B-MG": 167,
"B-MK": 59,
"B-ML": 85,
"B-MN": 61,
"B-MR": 79,
"B-MS": 23,
"B-MT": 187,
"B-MY": 117,
"B-NE": 185,
"B-NL": 13,
"B-NO": 31,
"B-NY": 205,
"B-OC": 139,
"B-OM": 169,
"B-OR": 91,
"B-PA": 87,
"B-PL": 41,
"B-PS": 97,
"B-PT": 11,
"B-RM": 191,
"B-RO": 45,
"B-RU": 47,
"B-SD": 99,
"B-SI": 121,
"B-SK": 155,
"B-SL": 153,
"B-SO": 171,
"B-SQ": 27,
"B-SR": 53,
"B-SU": 173,
"B-SV": 33,
"B-SW": 129,
"B-TA": 75,
"B-TE": 77,
"B-TG": 197,
"B-TH": 119,
"B-TI": 127,
"B-TL": 133,
"B-TR": 17,
"B-TT": 193,
"B-UG": 101,
"B-UK": 51,
"B-UR": 71,
"B-UZ": 175,
"B-VI": 15,
"B-YO": 201,
"B-ZH": 63,
"B-ZU": 203,
"I-AF": 26,
"I-AM": 112,
"I-AR": 94,
"I-AS": 90,
"I-BA": 200,
"I-BE": 56,
"I-BG": 50,
"I-BN": 74,
"I-BO": 124,
"I-BR": 142,
"I-BS": 150,
"I-CA": 136,
"I-CE": 208,
"I-CKB": 180,
"I-CS": 44,
"I-CY": 148,
"I-DA": 36,
"I-DE": 8,
"I-DV": 126,
"I-EL": 104,
"I-EN": 2,
"I-EO": 164,
"I-ES": 4,
"I-ET": 158,
"I-EU": 132,
"I-FA": 96,
"I-FI": 38,
"I-FR": 6,
"I-GA": 144,
"I-GD": 146,
"I-GL": 138,
"I-GRC": 184,
"I-GU": 82,
"I-HBO": 182,
"I-HE": 106,
"I-HI": 70,
"I-HR": 152,
"I-HU": 40,
"I-HY": 108,
"I-ID": 22,
"I-IS": 30,
"I-IT": 10,
"I-JA": 66,
"I-JV": 166,
"I-KA": 110,
"I-KK": 58,
"I-KM": 114,
"I-KN": 84,
"I-KO": 68,
"I-KU": 178,
"I-KY": 196,
"I-LA": 20,
"I-LB": 190,
"I-LO": 116,
"I-LT": 162,
"I-LV": 160,
"I-MG": 168,
"I-MK": 60,
"I-ML": 86,
"I-MN": 62,
"I-MR": 80,
"I-MS": 24,
"I-MT": 188,
"I-MY": 118,
"I-NE": 186,
"I-NL": 14,
"I-NO": 32,
"I-NY": 206,
"I-OC": 140,
"I-OM": 170,
"I-OR": 92,
"I-PA": 88,
"I-PL": 42,
"I-PS": 98,
"I-PT": 12,
"I-RM": 192,
"I-RO": 46,
"I-RU": 48,
"I-SD": 100,
"I-SI": 122,
"I-SK": 156,
"I-SL": 154,
"I-SO": 172,
"I-SQ": 28,
"I-SR": 54,
"I-SU": 174,
"I-SV": 34,
"I-SW": 130,
"I-TA": 76,
"I-TE": 78,
"I-TG": 198,
"I-TH": 120,
"I-TI": 128,
"I-TL": 134,
"I-TR": 18,
"I-TT": 194,
"I-UG": 102,
"I-UK": 52,
"I-UR": 72,
"I-UZ": 176,
"I-VI": 16,
"I-YO": 202,
"I-ZH": 64,
"I-ZU": 204,
"O": 0
},
"layer_norm_eps": 1e-05,
"max_position_embeddings": 514,
"model_type": "xlm-roberta",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"output_past": true,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"tie_word_embeddings": true,
"transformers_version": "5.0.0",
"type_vocab_size": 1,
"use_cache": false,
"vocab_size": 250002
}
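
This config describes an XLM-RoBERTa base encoder (12 layers, 768 hidden, 12 heads) with a token-classification head whose 209 labels are BIO tags for per-token language identification (an `O` tag plus `B-`/`I-` pairs for each language code). A minimal sketch of loading such a checkpoint with Hugging Face transformers follows; the path `"path/to/checkpoint"` is a placeholder for wherever this config.json and its trained weights live, since no repository path is given in the file itself.

```python
# Minimal sketch: token-level language identification with this config.
# "path/to/checkpoint" is a hypothetical local or Hub path, not taken from the config.
import torch
from transformers import AutoConfig, AutoModelForTokenClassification, AutoTokenizer

checkpoint = "path/to/checkpoint"  # placeholder

config = AutoConfig.from_pretrained(checkpoint)           # reads this config.json
tokenizer = AutoTokenizer.from_pretrained(checkpoint)     # XLM-R sentencepiece tokenizer
model = AutoModelForTokenClassification.from_pretrained(checkpoint, config=config)
model.eval()

text = "Hello world bonjour le monde"
inputs = tokenizer(text, return_tensors="pt")
with torch.no_grad():
    logits = model(**inputs).logits                       # shape: (1, seq_len, 209)

# Map each sub-token to a BIO language tag via id2label from the config.
pred_ids = logits.argmax(dim=-1)[0].tolist()
tokens = tokenizer.convert_ids_to_tokens(inputs["input_ids"][0])
for token, pred in zip(tokens, pred_ids):
    print(token, config.id2label[pred])
```

With the BIO scheme above, contiguous `B-XX`/`I-XX` predictions can be merged into language spans over the input, which is the usual way such token-classification output is post-processed.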