tlphams's picture
Training in progress, epoch 0
c292e93 verified
{
"_name_or_path": "facebook/dinov2-giant",
"apply_layernorm": true,
"architectures": [
"Dinov2ForImageClassification"
],
"attention_probs_dropout_prob": 0.0,
"drop_path_rate": 0.0,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 1536,
"id2label": {
"0": "k-01",
"1": "k-02",
"2": "k-03",
"3": "k-04",
"4": "k-05",
"5": "k-06",
"6": "k-07",
"7": "k-08",
"8": "k-09",
"9": "k-10",
"10": "k-11",
"11": "k-12",
"12": "k-13",
"13": "k-14",
"14": "k-15",
"15": "k-16",
"16": "k-17",
"17": "k-18",
"18": "k-19",
"19": "k-20",
"20": "k-21",
"21": "k-22",
"22": "k-23",
"23": "k-24",
"24": "k-25",
"25": "k-26",
"26": "k-27",
"27": "k-28",
"28": "k-29",
"29": "k-30",
"30": "k-31",
"31": "k-32",
"32": "k-33",
"33": "k-34",
"34": "k-35",
"35": "k-36",
"36": "k-37",
"37": "k-38",
"38": "k-39",
"39": "k-40",
"40": "k-41",
"41": "k-42",
"42": "k-43",
"43": "k-44",
"44": "k-45",
"45": "k-46",
"46": "k-47",
"47": "k-48",
"48": "k-49",
"49": "k-51",
"50": "k-52",
"51": "k-53",
"52": "k-54",
"53": "k-55",
"54": "k-56",
"55": "k-57",
"56": "k-58",
"57": "k-59",
"58": "k-60",
"59": "k-61",
"60": "k-62",
"61": "stamp0",
"62": "stamp1",
"63": "stamp10",
"64": "stamp11",
"65": "stamp12",
"66": "stamp13",
"67": "stamp14",
"68": "stamp15",
"69": "stamp16",
"70": "stamp17",
"71": "stamp18",
"72": "stamp19",
"73": "stamp2",
"74": "stamp20",
"75": "stamp21",
"76": "stamp22",
"77": "stamp23",
"78": "stamp24",
"79": "stamp25",
"80": "stamp3",
"81": "stamp4",
"82": "stamp5",
"83": "stamp6",
"84": "stamp7",
"85": "stamp8",
"86": "stamp9"
},
"image_size": 518,
"initializer_range": 0.02,
"label2id": {
"k-01": 0,
"k-02": 1,
"k-03": 2,
"k-04": 3,
"k-05": 4,
"k-06": 5,
"k-07": 6,
"k-08": 7,
"k-09": 8,
"k-10": 9,
"k-11": 10,
"k-12": 11,
"k-13": 12,
"k-14": 13,
"k-15": 14,
"k-16": 15,
"k-17": 16,
"k-18": 17,
"k-19": 18,
"k-20": 19,
"k-21": 20,
"k-22": 21,
"k-23": 22,
"k-24": 23,
"k-25": 24,
"k-26": 25,
"k-27": 26,
"k-28": 27,
"k-29": 28,
"k-30": 29,
"k-31": 30,
"k-32": 31,
"k-33": 32,
"k-34": 33,
"k-35": 34,
"k-36": 35,
"k-37": 36,
"k-38": 37,
"k-39": 38,
"k-40": 39,
"k-41": 40,
"k-42": 41,
"k-43": 42,
"k-44": 43,
"k-45": 44,
"k-46": 45,
"k-47": 46,
"k-48": 47,
"k-49": 48,
"k-51": 49,
"k-52": 50,
"k-53": 51,
"k-54": 52,
"k-55": 53,
"k-56": 54,
"k-57": 55,
"k-58": 56,
"k-59": 57,
"k-60": 58,
"k-61": 59,
"k-62": 60,
"stamp0": 61,
"stamp1": 62,
"stamp10": 63,
"stamp11": 64,
"stamp12": 65,
"stamp13": 66,
"stamp14": 67,
"stamp15": 68,
"stamp16": 69,
"stamp17": 70,
"stamp18": 71,
"stamp19": 72,
"stamp2": 73,
"stamp20": 74,
"stamp21": 75,
"stamp22": 76,
"stamp23": 77,
"stamp24": 78,
"stamp25": 79,
"stamp3": 80,
"stamp4": 81,
"stamp5": 82,
"stamp6": 83,
"stamp7": 84,
"stamp8": 85,
"stamp9": 86
},
"layer_norm_eps": 1e-06,
"layerscale_value": 1.0,
"mlp_ratio": 4,
"model_type": "dinov2",
"num_attention_heads": 24,
"num_channels": 3,
"num_hidden_layers": 40,
"out_features": [
"stage40"
],
"out_indices": [
40
],
"patch_size": 14,
"problem_type": "single_label_classification",
"qkv_bias": true,
"reshape_hidden_states": true,
"stage_names": [
"stem",
"stage1",
"stage2",
"stage3",
"stage4",
"stage5",
"stage6",
"stage7",
"stage8",
"stage9",
"stage10",
"stage11",
"stage12",
"stage13",
"stage14",
"stage15",
"stage16",
"stage17",
"stage18",
"stage19",
"stage20",
"stage21",
"stage22",
"stage23",
"stage24",
"stage25",
"stage26",
"stage27",
"stage28",
"stage29",
"stage30",
"stage31",
"stage32",
"stage33",
"stage34",
"stage35",
"stage36",
"stage37",
"stage38",
"stage39",
"stage40"
],
"torch_dtype": "float32",
"transformers_version": "4.45.0.dev0",
"use_swiglu_ffn": true
}