test-hasy-7 / config.json
khaingsmon's picture
Training in progress, epoch 1
b20eac8 verified
{
"_name_or_path": "google/vit-base-patch16-224-in21k",
"architectures": [
"ViTForImageClassification"
],
"attention_probs_dropout_prob": 0.0,
"encoder_stride": 16,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"id2label": {
"0": "A",
"1": "B",
"2": "C",
"3": "D",
"4": "E",
"5": "F",
"6": "G",
"7": "H",
"8": "I",
"9": "J",
"10": "K",
"11": "L",
"12": "M",
"13": "N",
"14": "O",
"15": "P",
"16": "Q",
"17": "R",
"18": "S",
"19": "T",
"20": "U",
"21": "V",
"22": "W",
"23": "X",
"24": "Y",
"25": "Z",
"26": "\\rightarrow",
"27": "0",
"28": "1",
"29": "2",
"30": "3",
"31": "4",
"32": "5",
"33": "6",
"34": "7",
"35": "8",
"36": "9",
"37": "\\pi",
"38": "\\alpha",
"39": "\\beta",
"40": "\\sum",
"41": "\\sigma",
"42": "a",
"43": "b",
"44": "c",
"45": "d",
"46": "e",
"47": "f",
"48": "g",
"49": "h",
"50": "i",
"51": "j",
"52": "k",
"53": "l",
"54": "m",
"55": "n",
"56": "o",
"57": "p",
"58": "q",
"59": "r",
"60": "s",
"61": "u",
"62": "v",
"63": "w",
"64": "x",
"65": "y",
"66": "z",
"67": "\\Sigma",
"68": "\\gamma",
"69": "\\Gamma",
"70": "\\delta",
"71": "\\Delta",
"72": "\\zeta",
"73": "\\eta",
"74": "\\theta",
"75": "\\Theta",
"76": "\\epsilon",
"77": "\\varepsilon",
"78": "\\iota",
"79": "\\kappa",
"80": "\\varkappa",
"81": "\\lambda",
"82": "\\Lambda",
"83": "\\mu",
"84": "\\nu",
"85": "\\xi",
"86": "\\Xi",
"87": "\\Pi",
"88": "\\rho",
"89": "\\varrho",
"90": "\\tau",
"91": "\\phi",
"92": "\\Phi",
"93": "\\varphi",
"94": "\\chi",
"95": "\\psi",
"96": "\\Psi",
"97": "\\omega",
"98": "\\Omega",
"99": "\\partial",
"100": "\\int",
"101": "\\cdot",
"102": "\\leq",
"103": "\\geq",
"104": "<",
"105": ">",
"106": "\\subset",
"107": "\\supset",
"108": "\\subseteq",
"109": "\\supseteq",
"110": "\\cong",
"111": "\\propto",
"112": "-",
"113": "+",
"114": "\\mathbb{R}",
"115": "\\$",
"116": "\\{",
"117": "\\copyright",
"118": "\\dots",
"119": "\\}",
"120": "\\S",
"121": "\\dag",
"122": "\\pounds",
"123": "\\&"
},
"image_size": 224,
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"+": 113,
"-": 112,
"0": 27,
"1": 28,
"2": 29,
"3": 30,
"4": 31,
"5": 32,
"6": 33,
"7": 34,
"8": 35,
"9": 36,
"<": 104,
">": 105,
"A": 0,
"B": 1,
"C": 2,
"D": 3,
"E": 4,
"F": 5,
"G": 6,
"H": 7,
"I": 8,
"J": 9,
"K": 10,
"L": 11,
"M": 12,
"N": 13,
"O": 14,
"P": 15,
"Q": 16,
"R": 17,
"S": 18,
"T": 19,
"U": 20,
"V": 21,
"W": 22,
"X": 23,
"Y": 24,
"Z": 25,
"\\$": 115,
"\\&": 123,
"\\Delta": 71,
"\\Gamma": 69,
"\\Lambda": 82,
"\\Omega": 98,
"\\Phi": 92,
"\\Pi": 87,
"\\Psi": 96,
"\\S": 120,
"\\Sigma": 67,
"\\Theta": 75,
"\\Xi": 86,
"\\alpha": 38,
"\\beta": 39,
"\\cdot": 101,
"\\chi": 94,
"\\cong": 110,
"\\copyright": 117,
"\\dag": 121,
"\\delta": 70,
"\\dots": 118,
"\\epsilon": 76,
"\\eta": 73,
"\\gamma": 68,
"\\geq": 103,
"\\int": 100,
"\\iota": 78,
"\\kappa": 79,
"\\lambda": 81,
"\\leq": 102,
"\\mathbb{R}": 114,
"\\mu": 83,
"\\nu": 84,
"\\omega": 97,
"\\partial": 99,
"\\phi": 91,
"\\pi": 37,
"\\pounds": 122,
"\\propto": 111,
"\\psi": 95,
"\\rho": 88,
"\\rightarrow": 26,
"\\sigma": 41,
"\\subset": 106,
"\\subseteq": 108,
"\\sum": 40,
"\\supset": 107,
"\\supseteq": 109,
"\\tau": 90,
"\\theta": 74,
"\\varepsilon": 77,
"\\varkappa": 80,
"\\varphi": 93,
"\\varrho": 89,
"\\xi": 85,
"\\zeta": 72,
"\\{": 116,
"\\}": 119,
"a": 42,
"b": 43,
"c": 44,
"d": 45,
"e": 46,
"f": 47,
"g": 48,
"h": 49,
"i": 50,
"j": 51,
"k": 52,
"l": 53,
"m": 54,
"n": 55,
"o": 56,
"p": 57,
"q": 58,
"r": 59,
"s": 60,
"u": 61,
"v": 62,
"w": 63,
"x": 64,
"y": 65,
"z": 66
},
"layer_norm_eps": 1e-12,
"model_type": "vit",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"patch_size": 16,
"problem_type": "single_label_classification",
"qkv_bias": true,
"torch_dtype": "float32",
"transformers_version": "4.38.2"
}