| { |
| "architectures": [ |
| "ModernBertForSequenceClassification" |
| ], |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": 50281, |
| "classifier_activation": "gelu", |
| "classifier_bias": false, |
| "classifier_dropout": 0.0, |
| "classifier_pooling": "mean", |
| "cls_token_id": 50281, |
| "decoder_bias": true, |
| "deterministic_flash_attn": false, |
| "embedding_dropout": 0.0, |
| "eos_token_id": 50282, |
| "global_attn_every_n_layers": 3, |
| "global_rope_theta": 160000.0, |
| "gradient_checkpointing": false, |
| "hidden_activation": "gelu", |
| "hidden_size": 768, |
| "id2label": { |
| "0": "0", |
| "1": "1", |
| "10": "10", |
| "11": "11", |
| "12": "12", |
| "13": "13", |
| "14": "14", |
| "15": "15", |
| "16": "16", |
| "17": "17", |
| "18": "18", |
| "19": "19", |
| "2": "2", |
| "20": "20", |
| "21": "21", |
| "22": "22", |
| "23": "23", |
| "24": "24", |
| "25": "25", |
| "26": "26", |
| "27": "27", |
| "28": "28", |
| "29": "29", |
| "3": "3", |
| "30": "30", |
| "31": "31", |
| "32": "32", |
| "33": "33", |
| "34": "34", |
| "35": "35", |
| "36": "36", |
| "37": "37", |
| "38": "38", |
| "39": "39", |
| "4": "4", |
| "40": "40", |
| "41": "41", |
| "42": "42", |
| "43": "43", |
| "44": "44", |
| "45": "45", |
| "46": "46", |
| "47": "47", |
| "48": "48", |
| "49": "49", |
| "5": "5", |
| "50": "50", |
| "6": "6", |
| "7": "7", |
| "8": "8", |
| "9": "9" |
| }, |
| "initializer_cutoff_factor": 2.0, |
| "initializer_range": 0.02, |
| "intermediate_size": 1152, |
| "label2id": { |
| "0": 0, |
| "1": 1, |
| "2": 2, |
| "3": 3, |
| "4": 4, |
| "5": 5, |
| "6": 6, |
| "7": 7, |
| "8": 8, |
| "9": 9, |
| "10": 10, |
| "11": 11, |
| "12": 12, |
| "13": 13, |
| "14": 14, |
| "15": 15, |
| "16": 16, |
| "17": 17, |
| "18": 18, |
| "19": 19, |
| "20": 20, |
| "21": 21, |
| "22": 22, |
| "23": 23, |
| "24": 24, |
| "25": 25, |
| "26": 26, |
| "27": 27, |
| "28": 28, |
| "29": 29, |
| "30": 30, |
| "31": 31, |
| "32": 32, |
| "33": 33, |
| "34": 34, |
| "35": 35, |
| "36": 36, |
| "37": 37, |
| "38": 38, |
| "39": 39, |
| "40": 40, |
| "41": 41, |
| "42": 42, |
| "43": 43, |
| "44": 44, |
| "45": 45, |
| "46": 46, |
| "47": 47, |
| "48": 48, |
| "49": 49, |
| "50": 50 |
| }, |
| "layer_norm_eps": 1e-05, |
| "local_attention": 128, |
| "local_rope_theta": 10000.0, |
| "max_position_embeddings": 8192, |
| "mlp_bias": false, |
| "mlp_dropout": 0.0, |
| "model_type": "modernbert", |
| "norm_bias": false, |
| "norm_eps": 1e-05, |
| "num_attention_heads": 12, |
| "num_hidden_layers": 22, |
| "pad_token_id": 50283, |
| "position_embedding_type": "absolute", |
| "problem_type": "single_label_classification", |
| "repad_logits_with_grad": false, |
| "sep_token_id": 50282, |
| "sparse_pred_ignore_index": -100, |
| "sparse_prediction": false, |
| "torch_dtype": "float32", |
| "transformers_version": "4.55.2", |
| "vocab_size": 50368 |
| } |
|
|