GeneZC's picture
Update config.json
68f861a
{
"_name_or_path": "ckpt-last",
"architectures": [
"SparseBertMiniLM"
],
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"initializer_range": 0.02,
"intermediate_size": 3072,
"layer_norm_eps": 1e-12,
"layer_skip": 1,
"max_position_embeddings": 512,
"model_type": "bert",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"num_relation_heads": 32,
"pad_token_id": 0,
"position_embedding_type": "absolute",
"sparsity": "90",
"sparsity_map": {
"0": {
"head": {},
"hidden": {
"-1": 0,
"0": 0,
"1": 0,
"10": 0,
"11": 0,
"2": 0,
"3": 0,
"4": 0,
"5": 0,
"6": 0,
"7": 0,
"8": 0,
"9": 0
},
"neuron": {}
},
"10": {
"head": {
"1": 5,
"11": 1,
"3": 1
},
"hidden": {
"-1": 38,
"0": 38,
"1": 38,
"10": 38,
"11": 38,
"2": 38,
"3": 38,
"4": 38,
"5": 38,
"6": 38,
"7": 38,
"8": 38,
"9": 38
},
"neuron": {
"0": 190,
"1": 298,
"11": 1,
"2": 1323,
"3": 4,
"4": 5,
"5": 8,
"6": 4,
"7": 7,
"8": 2,
"9": 1
}
},
"20": {
"head": {
"0": 1,
"1": 7,
"10": 1,
"11": 4,
"3": 2,
"9": 1
},
"hidden": {
"-1": 84,
"0": 84,
"1": 84,
"10": 84,
"11": 84,
"2": 84,
"3": 84,
"4": 84,
"5": 84,
"6": 84,
"7": 84,
"8": 84,
"9": 84
},
"neuron": {
"0": 597,
"1": 802,
"11": 16,
"2": 2294,
"3": 48,
"4": 78,
"5": 123,
"6": 22,
"7": 47,
"8": 23,
"9": 5
}
},
"30": {
"head": {
"0": 1,
"1": 8,
"10": 2,
"11": 4,
"2": 1,
"3": 2,
"6": 1,
"7": 1,
"8": 1,
"9": 2
},
"hidden": {
"-1": 123,
"0": 123,
"1": 123,
"10": 123,
"11": 123,
"2": 123,
"3": 123,
"4": 123,
"5": 123,
"6": 123,
"7": 123,
"8": 123,
"9": 123
},
"neuron": {
"0": 980,
"1": 1233,
"10": 2,
"11": 116,
"2": 2512,
"3": 132,
"4": 233,
"5": 386,
"6": 61,
"7": 146,
"8": 73,
"9": 24
}
},
"40": {
"head": {
"0": 3,
"1": 8,
"10": 2,
"11": 5,
"2": 1,
"3": 3,
"4": 2,
"5": 1,
"6": 2,
"7": 1,
"8": 1,
"9": 4
},
"hidden": {
"-1": 177,
"0": 177,
"1": 177,
"10": 177,
"11": 177,
"2": 177,
"3": 177,
"4": 177,
"5": 177,
"6": 177,
"7": 177,
"8": 177,
"9": 177
},
"neuron": {
"0": 1436,
"1": 1664,
"10": 6,
"11": 518,
"2": 2634,
"3": 306,
"4": 449,
"5": 732,
"6": 138,
"7": 321,
"8": 184,
"9": 91
}
},
"50": {
"head": {
"0": 5,
"1": 8,
"10": 3,
"11": 5,
"2": 2,
"3": 3,
"4": 3,
"5": 2,
"6": 3,
"7": 2,
"8": 2,
"9": 4
},
"hidden": {
"-1": 223,
"0": 223,
"1": 223,
"10": 223,
"11": 223,
"2": 223,
"3": 223,
"4": 223,
"5": 223,
"6": 223,
"7": 223,
"8": 223,
"9": 223
},
"neuron": {
"0": 1749,
"1": 1933,
"10": 21,
"11": 915,
"2": 2699,
"3": 519,
"4": 664,
"5": 976,
"6": 252,
"7": 469,
"8": 307,
"9": 187
}
},
"60": {
"head": {
"0": 6,
"1": 8,
"10": 5,
"11": 7,
"2": 3,
"3": 4,
"4": 4,
"5": 3,
"6": 5,
"7": 2,
"8": 2,
"9": 4
},
"hidden": {
"-1": 284,
"0": 284,
"1": 284,
"10": 284,
"11": 284,
"2": 284,
"3": 284,
"4": 284,
"5": 284,
"6": 284,
"7": 284,
"8": 284,
"9": 284
},
"neuron": {
"0": 2065,
"1": 2200,
"10": 67,
"11": 1392,
"2": 2762,
"3": 817,
"4": 991,
"5": 1279,
"6": 454,
"7": 695,
"8": 521,
"9": 397
}
},
"70": {
"head": {
"0": 6,
"1": 8,
"10": 6,
"11": 7,
"2": 4,
"3": 6,
"4": 4,
"5": 5,
"6": 6,
"7": 3,
"8": 5,
"9": 5
},
"hidden": {
"-1": 346,
"0": 346,
"1": 346,
"10": 346,
"11": 346,
"2": 346,
"3": 346,
"4": 346,
"5": 346,
"6": 346,
"7": 346,
"8": 346,
"9": 346
},
"neuron": {
"0": 2266,
"1": 2390,
"10": 206,
"11": 1745,
"2": 2820,
"3": 1173,
"4": 1308,
"5": 1537,
"6": 694,
"7": 951,
"8": 791,
"9": 708
}
},
"80": {
"head": {
"0": 6,
"1": 9,
"10": 8,
"11": 8,
"2": 6,
"3": 6,
"4": 6,
"5": 9,
"6": 7,
"7": 4,
"8": 5,
"9": 5
},
"hidden": {
"-1": 422,
"0": 422,
"1": 422,
"10": 422,
"11": 422,
"2": 422,
"3": 422,
"4": 422,
"5": 422,
"6": 422,
"7": 422,
"8": 422,
"9": 422
},
"neuron": {
"0": 2450,
"1": 2541,
"10": 574,
"11": 2105,
"2": 2863,
"3": 1559,
"4": 1676,
"5": 1862,
"6": 1071,
"7": 1294,
"8": 1154,
"9": 1126
}
},
"85": {
"head": {
"0": 6,
"1": 9,
"10": 10,
"11": 8,
"2": 6,
"3": 6,
"4": 7,
"5": 9,
"6": 8,
"7": 7,
"8": 5,
"9": 7
},
"hidden": {
"-1": 468,
"0": 468,
"1": 468,
"10": 468,
"11": 468,
"2": 468,
"3": 468,
"4": 468,
"5": 468,
"6": 468,
"7": 468,
"8": 468,
"9": 468
},
"neuron": {
"0": 2554,
"1": 2635,
"10": 936,
"11": 2278,
"2": 2889,
"3": 1780,
"4": 1836,
"5": 2037,
"6": 1292,
"7": 1489,
"8": 1360,
"9": 1401
}
},
"90": {
"head": {
"0": 6,
"1": 9,
"10": 11,
"11": 8,
"2": 7,
"3": 7,
"4": 9,
"5": 9,
"6": 9,
"7": 9,
"8": 6,
"9": 8
},
"hidden": {
"-1": 522,
"0": 522,
"1": 522,
"10": 522,
"11": 522,
"2": 522,
"3": 522,
"4": 522,
"5": 522,
"6": 522,
"7": 522,
"8": 522,
"9": 522
},
"neuron": {
"0": 2653,
"1": 2713,
"10": 1390,
"11": 2433,
"2": 2913,
"3": 2013,
"4": 2064,
"5": 2243,
"6": 1569,
"7": 1741,
"8": 1648,
"9": 1688
}
},
"95": {
"head": {
"0": 8,
"1": 10,
"10": 11,
"11": 9,
"2": 9,
"3": 9,
"4": 9,
"5": 9,
"6": 11,
"7": 9,
"8": 9,
"9": 9
},
"hidden": {
"-1": 599,
"0": 599,
"1": 599,
"10": 599,
"11": 599,
"2": 599,
"3": 599,
"4": 599,
"5": 599,
"6": 599,
"7": 599,
"8": 599,
"9": 599
},
"neuron": {
"0": 2753,
"1": 2799,
"10": 2001,
"11": 2654,
"2": 2948,
"3": 2337,
"4": 2381,
"5": 2519,
"6": 1992,
"7": 2148,
"8": 2061,
"9": 2161
}
},
"96": {
"head": {
"0": 9,
"1": 10,
"10": 11,
"11": 10,
"2": 9,
"3": 9,
"4": 9,
"5": 10,
"6": 11,
"7": 9,
"8": 9,
"9": 9
},
"hidden": {
"-1": 614,
"0": 614,
"1": 614,
"10": 614,
"11": 614,
"2": 614,
"3": 614,
"4": 614,
"5": 614,
"6": 614,
"7": 614,
"8": 614,
"9": 614
},
"neuron": {
"0": 2768,
"1": 2822,
"10": 2133,
"11": 2689,
"2": 2955,
"3": 2392,
"4": 2439,
"5": 2579,
"6": 2077,
"7": 2223,
"8": 2148,
"9": 2266
}
},
"97": {
"head": {
"0": 10,
"1": 10,
"10": 11,
"11": 10,
"2": 9,
"3": 9,
"4": 9,
"5": 10,
"6": 11,
"7": 10,
"8": 11,
"9": 10
},
"hidden": {
"-1": 637,
"0": 637,
"1": 637,
"10": 637,
"11": 637,
"2": 637,
"3": 637,
"4": 637,
"5": 637,
"6": 637,
"7": 637,
"8": 637,
"9": 637
},
"neuron": {
"0": 2799,
"1": 2846,
"10": 2294,
"11": 2746,
"2": 2970,
"3": 2487,
"4": 2537,
"5": 2656,
"6": 2207,
"7": 2355,
"8": 2291,
"9": 2409
}
},
"98": {
"head": {
"0": 11,
"1": 10,
"10": 11,
"11": 10,
"2": 10,
"3": 10,
"4": 10,
"5": 10,
"6": 11,
"7": 10,
"8": 11,
"9": 10
},
"hidden": {
"-1": 660,
"0": 660,
"1": 660,
"10": 660,
"11": 660,
"2": 660,
"3": 660,
"4": 660,
"5": 660,
"6": 660,
"7": 660,
"8": 660,
"9": 660
},
"neuron": {
"0": 2826,
"1": 2870,
"10": 2455,
"11": 2794,
"2": 2984,
"3": 2588,
"4": 2634,
"5": 2726,
"6": 2350,
"7": 2501,
"8": 2440,
"9": 2535
}
},
"99": {
"head": {
"0": 11,
"1": 10,
"10": 11,
"11": 11,
"2": 11,
"3": 11,
"4": 11,
"5": 11,
"6": 11,
"7": 11,
"8": 11,
"9": 10
},
"hidden": {
"-1": 691,
"0": 691,
"1": 691,
"10": 691,
"11": 691,
"2": 691,
"3": 691,
"4": 691,
"5": 691,
"6": 691,
"7": 691,
"8": 691,
"9": 691
},
"neuron": {
"0": 2861,
"1": 2915,
"10": 2683,
"11": 2862,
"2": 2998,
"3": 2709,
"4": 2746,
"5": 2845,
"6": 2551,
"7": 2678,
"8": 2635,
"9": 2695
}
}
},
"torch_dtype": "float32",
"transformers_version": "4.9.2",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 30522
}