| { |
| "architectures": [ |
| "ModernBertForSequenceClassification" |
| ], |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": 2, |
| "classifier_activation": "gelu", |
| "classifier_bias": false, |
| "classifier_dropout": 0.0, |
| "classifier_pooling": "mean", |
| "cls_token_id": 1, |
| "decoder_bias": true, |
| "deterministic_flash_attn": false, |
| "dtype": "float32", |
| "embedding_dropout": 0.0, |
| "eos_token_id": 1, |
| "global_attn_every_n_layers": 3, |
| "global_rope_theta": 160000, |
| "gradient_checkpointing": false, |
| "hidden_activation": "gelu", |
| "hidden_size": 768, |
| "id2label": { |
| "0": "aeb", |
| "1": "afr", |
| "2": "als", |
| "3": "amh", |
| "4": "anp", |
| "5": "apc", |
| "6": "arb", |
| "7": "arg", |
| "8": "ars", |
| "9": "ary", |
| "10": "arz", |
| "11": "asm", |
| "12": "ast", |
| "13": "azb", |
| "14": "azj", |
| "15": "bak", |
| "16": "bar", |
| "17": "bel", |
| "18": "ben", |
| "19": "bew", |
| "20": "bho", |
| "21": "bod", |
| "22": "bos", |
| "23": "bul", |
| "24": "cat", |
| "25": "ceb", |
| "26": "ces", |
| "27": "che", |
| "28": "chv", |
| "29": "ckb", |
| "30": "cmn", |
| "31": "cnh", |
| "32": "cos", |
| "33": "crh", |
| "34": "cym", |
| "35": "dan", |
| "36": "deu", |
| "37": "div", |
| "38": "dzo", |
| "39": "ekk", |
| "40": "ell", |
| "41": "eng", |
| "42": "epo", |
| "43": "eus", |
| "44": "fao", |
| "45": "fas", |
| "46": "fij", |
| "47": "fil", |
| "48": "fin", |
| "49": "fra", |
| "50": "fry", |
| "51": "fur", |
| "52": "gaz", |
| "53": "gla", |
| "54": "gle", |
| "55": "glg", |
| "56": "glk", |
| "57": "grc", |
| "58": "gsw", |
| "59": "guj", |
| "60": "hac", |
| "61": "hat", |
| "62": "hau", |
| "63": "haw", |
| "64": "hbo", |
| "65": "heb", |
| "66": "hif", |
| "67": "hil", |
| "68": "hin", |
| "69": "hne", |
| "70": "hrv", |
| "71": "hsb", |
| "72": "hun", |
| "73": "hye", |
| "74": "hyw", |
| "75": "iba", |
| "76": "ibo", |
| "77": "ilo", |
| "78": "ind", |
| "79": "isl", |
| "80": "ita", |
| "81": "jav", |
| "82": "jpn", |
| "83": "kal", |
| "84": "kan", |
| "85": "kat", |
| "86": "kaz", |
| "87": "kha", |
| "88": "khk", |
| "89": "khm", |
| "90": "kin", |
| "91": "kir", |
| "92": "kiu", |
| "93": "kmr", |
| "94": "kor", |
| "95": "lao", |
| "96": "lat", |
| "97": "lim", |
| "98": "lin", |
| "99": "lit", |
| "100": "ltz", |
| "101": "lug", |
| "102": "lus", |
| "103": "lvs", |
| "104": "mai", |
| "105": "mal", |
| "106": "mar", |
| "107": "mhr", |
| "108": "mkd", |
| "109": "mlt", |
| "110": "mri", |
| "111": "mww", |
| "112": "mya", |
| "113": "nap", |
| "114": "nde", |
| "115": "nds", |
| "116": "new", |
| "117": "nld", |
| "118": "nno", |
| "119": "nob", |
| "120": "npi", |
| "121": "nrm", |
| "122": "nya", |
| "123": "oci", |
| "124": "ory", |
| "125": "oss", |
| "126": "pan", |
| "127": "pap", |
| "128": "pbt", |
| "129": "plt", |
| "130": "pnb", |
| "131": "pol", |
| "132": "por", |
| "133": "roh", |
| "134": "ron", |
| "135": "rue", |
| "136": "run", |
| "137": "rus", |
| "138": "sah", |
| "139": "san", |
| "140": "scn", |
| "141": "sdh", |
| "142": "sin", |
| "143": "slk", |
| "144": "slv", |
| "145": "sme", |
| "146": "smo", |
| "147": "sna", |
| "148": "snd", |
| "149": "som", |
| "150": "sot", |
| "151": "spa", |
| "152": "srd", |
| "153": "srp", |
| "154": "sun", |
| "155": "swe", |
| "156": "swh", |
| "157": "tam", |
| "158": "tat", |
| "159": "tel", |
| "160": "tgk", |
| "161": "tha", |
| "162": "tir", |
| "163": "tuk", |
| "164": "tur", |
| "165": "tyv", |
| "166": "udm", |
| "167": "uig", |
| "168": "ukr", |
| "169": "urd", |
| "170": "uzn", |
| "171": "uzs", |
| "172": "vie", |
| "173": "xho", |
| "174": "ydd", |
| "175": "yor", |
| "176": "yue", |
| "177": "zea", |
| "178": "zsm", |
| "179": "zul" |
| }, |
| "initializer_cutoff_factor": 2.0, |
| "initializer_range": 0.02, |
| "intermediate_size": 1152, |
| "label2id": { |
| "aeb": 0, |
| "afr": 1, |
| "als": 2, |
| "amh": 3, |
| "anp": 4, |
| "apc": 5, |
| "arb": 6, |
| "arg": 7, |
| "ars": 8, |
| "ary": 9, |
| "arz": 10, |
| "asm": 11, |
| "ast": 12, |
| "azb": 13, |
| "azj": 14, |
| "bak": 15, |
| "bar": 16, |
| "bel": 17, |
| "ben": 18, |
| "bew": 19, |
| "bho": 20, |
| "bod": 21, |
| "bos": 22, |
| "bul": 23, |
| "cat": 24, |
| "ceb": 25, |
| "ces": 26, |
| "che": 27, |
| "chv": 28, |
| "ckb": 29, |
| "cmn": 30, |
| "cnh": 31, |
| "cos": 32, |
| "crh": 33, |
| "cym": 34, |
| "dan": 35, |
| "deu": 36, |
| "div": 37, |
| "dzo": 38, |
| "ekk": 39, |
| "ell": 40, |
| "eng": 41, |
| "epo": 42, |
| "eus": 43, |
| "fao": 44, |
| "fas": 45, |
| "fij": 46, |
| "fil": 47, |
| "fin": 48, |
| "fra": 49, |
| "fry": 50, |
| "fur": 51, |
| "gaz": 52, |
| "gla": 53, |
| "gle": 54, |
| "glg": 55, |
| "glk": 56, |
| "grc": 57, |
| "gsw": 58, |
| "guj": 59, |
| "hac": 60, |
| "hat": 61, |
| "hau": 62, |
| "haw": 63, |
| "hbo": 64, |
| "heb": 65, |
| "hif": 66, |
| "hil": 67, |
| "hin": 68, |
| "hne": 69, |
| "hrv": 70, |
| "hsb": 71, |
| "hun": 72, |
| "hye": 73, |
| "hyw": 74, |
| "iba": 75, |
| "ibo": 76, |
| "ilo": 77, |
| "ind": 78, |
| "isl": 79, |
| "ita": 80, |
| "jav": 81, |
| "jpn": 82, |
| "kal": 83, |
| "kan": 84, |
| "kat": 85, |
| "kaz": 86, |
| "kha": 87, |
| "khk": 88, |
| "khm": 89, |
| "kin": 90, |
| "kir": 91, |
| "kiu": 92, |
| "kmr": 93, |
| "kor": 94, |
| "lao": 95, |
| "lat": 96, |
| "lim": 97, |
| "lin": 98, |
| "lit": 99, |
| "ltz": 100, |
| "lug": 101, |
| "lus": 102, |
| "lvs": 103, |
| "mai": 104, |
| "mal": 105, |
| "mar": 106, |
| "mhr": 107, |
| "mkd": 108, |
| "mlt": 109, |
| "mri": 110, |
| "mww": 111, |
| "mya": 112, |
| "nap": 113, |
| "nde": 114, |
| "nds": 115, |
| "new": 116, |
| "nld": 117, |
| "nno": 118, |
| "nob": 119, |
| "npi": 120, |
| "nrm": 121, |
| "nya": 122, |
| "oci": 123, |
| "ory": 124, |
| "oss": 125, |
| "pan": 126, |
| "pap": 127, |
| "pbt": 128, |
| "plt": 129, |
| "pnb": 130, |
| "pol": 131, |
| "por": 132, |
| "roh": 133, |
| "ron": 134, |
| "rue": 135, |
| "run": 136, |
| "rus": 137, |
| "sah": 138, |
| "san": 139, |
| "scn": 140, |
| "sdh": 141, |
| "sin": 142, |
| "slk": 143, |
| "slv": 144, |
| "sme": 145, |
| "smo": 146, |
| "sna": 147, |
| "snd": 148, |
| "som": 149, |
| "sot": 150, |
| "spa": 151, |
| "srd": 152, |
| "srp": 153, |
| "sun": 154, |
| "swe": 155, |
| "swh": 156, |
| "tam": 157, |
| "tat": 158, |
| "tel": 159, |
| "tgk": 160, |
| "tha": 161, |
| "tir": 162, |
| "tuk": 163, |
| "tur": 164, |
| "tyv": 165, |
| "udm": 166, |
| "uig": 167, |
| "ukr": 168, |
| "urd": 169, |
| "uzn": 170, |
| "uzs": 171, |
| "vie": 172, |
| "xho": 173, |
| "ydd": 174, |
| "yor": 175, |
| "yue": 176, |
| "zea": 177, |
| "zsm": 178, |
| "zul": 179 |
| }, |
| "layer_norm_eps": 1e-05, |
| "local_attention": 128, |
| "local_rope_theta": 160000, |
| "mask_token_id": 4, |
| "max_position_embeddings": 8192, |
| "mlp_bias": false, |
| "mlp_dropout": 0.0, |
| "model_type": "modernbert", |
| "norm_bias": false, |
| "norm_eps": 1e-05, |
| "num_attention_heads": 12, |
| "num_hidden_layers": 22, |
| "pad_token_id": 0, |
| "position_embedding_type": "sans_pos", |
| "problem_type": "single_label_classification", |
| "repad_logits_with_grad": false, |
| "sep_token_id": 1, |
| "sparse_pred_ignore_index": -100, |
| "sparse_prediction": false, |
| "transformers_version": "4.57.6", |
| "vocab_size": 256000 |
| } |
|
|