my_awesome_model / config.json
jacksprat's picture
Training in progress, epoch 1
35d5eea
raw
history blame contribute delete
No virus
3.8 kB
{
"_name_or_path": "distilbert-base-uncased",
"activation": "gelu",
"architectures": [
"DistilBertForSequenceClassification"
],
"attention_dropout": 0.1,
"dim": 768,
"dropout": 0.1,
"hidden_dim": 3072,
"id2label": {
"0": "C50.9",
"1": "C61.9",
"2": "C50.8",
"3": "C50.4",
"4": "C50.2",
"5": "C13.9",
"6": "C80.9",
"7": "C34.9",
"8": "C42.1",
"9": "C18.0",
"10": "C15.5",
"11": "C00.1",
"12": "C34.0",
"13": "C00.0",
"14": "C44.3",
"15": "C24.0",
"16": "C64.9",
"17": "C34.1",
"18": "C22.0",
"19": "C20.9",
"20": "C00.2",
"21": "C50.5",
"22": "C18.7",
"23": "C34.3",
"24": "C67.9",
"25": "C77.4",
"26": "C17.9",
"27": "C44.7",
"28": "C77.2",
"29": "C18.2",
"30": "C18.3",
"31": "C18.9",
"32": "C44.5",
"33": "C16.9",
"34": "C25.0",
"35": "C44.6",
"36": "C19.9",
"37": "C09.8",
"38": "C55.9",
"39": "C43.9",
"40": "C01.9",
"41": "C48.0",
"42": "C54.1",
"43": "C62.9",
"44": "C69.3",
"45": "C50.3",
"46": "C02.9",
"47": "C77.9",
"48": "C62.1",
"49": "C18.1",
"50": "C73.9",
"51": "C44.9",
"52": "C77.5",
"53": "C15.9",
"54": "C21.0",
"55": "C67.0",
"56": "C18.6",
"57": "C44.2",
"58": "C25.9",
"59": "C30.0",
"60": "C77.0",
"61": "C13.1",
"62": "C71.9",
"63": "C42.0",
"64": "C34.2",
"65": "C52.2",
"66": "C17.2",
"67": "C44.4",
"68": "C18.4",
"69": "C09.9",
"70": "C22.1",
"71": "C17.0",
"72": "C71.8",
"73": "C16.0",
"74": "C49.3",
"75": "C71.2",
"76": "C41.0",
"77": "C53.9",
"78": "C69.0",
"79": "C37.9",
"80": "C76.3",
"81": "C50.",
"82": "C16.2",
"83": "C18.5",
"84": "C32.3",
"85": "C66.9",
"86": "C56.9",
"87": "C53.0"
},
"initializer_range": 0.02,
"label2id": {
"C00.0": 13,
"C00.1": 11,
"C00.2": 20,
"C01.9": 40,
"C02.9": 46,
"C09.8": 37,
"C09.9": 69,
"C13.1": 61,
"C13.9": 5,
"C15.5": 10,
"C15.9": 53,
"C16.0": 73,
"C16.2": 82,
"C16.9": 33,
"C17.0": 71,
"C17.2": 66,
"C17.9": 26,
"C18.0": 9,
"C18.1": 49,
"C18.2": 29,
"C18.3": 30,
"C18.4": 68,
"C18.5": 83,
"C18.6": 56,
"C18.7": 22,
"C18.9": 31,
"C19.9": 36,
"C20.9": 19,
"C21.0": 54,
"C22.0": 18,
"C22.1": 70,
"C24.0": 15,
"C25.0": 34,
"C25.9": 58,
"C30.0": 59,
"C32.3": 84,
"C34.0": 12,
"C34.1": 17,
"C34.2": 64,
"C34.3": 23,
"C34.9": 7,
"C37.9": 79,
"C41.0": 76,
"C42.0": 63,
"C42.1": 8,
"C43.9": 39,
"C44.2": 57,
"C44.3": 14,
"C44.4": 67,
"C44.5": 32,
"C44.6": 35,
"C44.7": 27,
"C44.9": 51,
"C48.0": 41,
"C49.3": 74,
"C50.": 81,
"C50.2": 4,
"C50.3": 45,
"C50.4": 3,
"C50.5": 21,
"C50.8": 2,
"C50.9": 0,
"C52.2": 65,
"C53.0": 87,
"C53.9": 77,
"C54.1": 42,
"C55.9": 38,
"C56.9": 86,
"C61.9": 1,
"C62.1": 48,
"C62.9": 43,
"C64.9": 16,
"C66.9": 85,
"C67.0": 55,
"C67.9": 24,
"C69.0": 78,
"C69.3": 44,
"C71.2": 75,
"C71.8": 72,
"C71.9": 62,
"C73.9": 50,
"C76.3": 80,
"C77.0": 60,
"C77.2": 28,
"C77.4": 25,
"C77.5": 52,
"C77.9": 47,
"C80.9": 6
},
"max_position_embeddings": 512,
"model_type": "distilbert",
"n_heads": 12,
"n_layers": 6,
"pad_token_id": 0,
"problem_type": "single_label_classification",
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.18.0",
"vocab_size": 30522
}