Vui Seng Chua
Update collateral
68c7f51
pt_module_name block_id orig_w_shape final_w_shape orig_b_shape final_b_shape prune_by id_to_keep head_id_to_keep nncf_graph_node
0 nncf_module.bert.encoder.layer.0.attention.self.key 0 (1024, 1024) (448, 1024) (1024,) (448,) group of 64 rows See pkl [1, 2, 6, 7, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
1 nncf_module.bert.encoder.layer.0.attention.self.value 0 (1024, 1024) (448, 1024) (1024,) (448,) group of 64 rows See pkl [1, 2, 6, 7, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
2 nncf_module.bert.encoder.layer.0.attention.self.query 0 (1024, 1024) (448, 1024) (1024,) (448,) group of 64 rows See pkl [1, 2, 6, 7, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
3 nncf_module.bert.encoder.layer.0.attention.output.dense 0 (1024, 1024) (1024, 448) (1024,) (1024,) group of 64 cols See pkl [1, 2, 6, 7, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
4 nncf_module.bert.encoder.layer.0.intermediate.dense 1 (4096, 1024) (915, 1024) (4096,) (915,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
5 nncf_module.bert.encoder.layer.0.output.dense 1 (1024, 4096) (1024, 915) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertOutput[output]/NNCFLinear[dense]/linear_0
6 nncf_module.bert.encoder.layer.1.attention.self.query 2 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
7 nncf_module.bert.encoder.layer.1.attention.self.value 2 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
8 nncf_module.bert.encoder.layer.1.attention.self.key 2 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
9 nncf_module.bert.encoder.layer.1.attention.output.dense 2 (1024, 1024) (1024, 64) (1024,) (1024,) group of 64 cols See pkl [8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
10 nncf_module.bert.encoder.layer.1.output.dense 3 (1024, 4096) (1024, 829) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertOutput[output]/NNCFLinear[dense]/linear_0
11 nncf_module.bert.encoder.layer.1.intermediate.dense 3 (4096, 1024) (829, 1024) (4096,) (829,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
12 nncf_module.bert.encoder.layer.2.attention.output.dense 4 (1024, 1024) (1024, 128) (1024,) (1024,) group of 64 cols See pkl [3, 5] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
13 nncf_module.bert.encoder.layer.2.attention.self.value 4 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [3, 5] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
14 nncf_module.bert.encoder.layer.2.attention.self.key 4 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [3, 5] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
15 nncf_module.bert.encoder.layer.2.attention.self.query 4 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [3, 5] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
16 nncf_module.bert.encoder.layer.2.output.dense 5 (1024, 4096) (1024, 1181) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertOutput[output]/NNCFLinear[dense]/linear_0
17 nncf_module.bert.encoder.layer.2.intermediate.dense 5 (4096, 1024) (1181, 1024) (4096,) (1181,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
18 nncf_module.bert.encoder.layer.3.attention.self.value 6 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [4, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
19 nncf_module.bert.encoder.layer.3.attention.self.key 6 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [4, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
20 nncf_module.bert.encoder.layer.3.attention.self.query 6 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [4, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
21 nncf_module.bert.encoder.layer.3.attention.output.dense 6 (1024, 1024) (1024, 128) (1024,) (1024,) group of 64 cols See pkl [4, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
22 nncf_module.bert.encoder.layer.3.output.dense 7 (1024, 4096) (1024, 1526) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertOutput[output]/NNCFLinear[dense]/linear_0
23 nncf_module.bert.encoder.layer.3.intermediate.dense 7 (4096, 1024) (1526, 1024) (4096,) (1526,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
24 nncf_module.bert.encoder.layer.4.attention.self.key 8 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
25 nncf_module.bert.encoder.layer.4.attention.self.value 8 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
26 nncf_module.bert.encoder.layer.4.attention.self.query 8 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
27 nncf_module.bert.encoder.layer.4.attention.output.dense 8 (1024, 1024) (1024, 64) (1024,) (1024,) group of 64 cols See pkl [15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
28 nncf_module.bert.encoder.layer.4.output.dense 9 (1024, 4096) (1024, 1749) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertOutput[output]/NNCFLinear[dense]/linear_0
29 nncf_module.bert.encoder.layer.4.intermediate.dense 9 (4096, 1024) (1749, 1024) (4096,) (1749,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
30 nncf_module.bert.encoder.layer.5.attention.self.query 10 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
31 nncf_module.bert.encoder.layer.5.attention.output.dense 10 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 cols See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
32 nncf_module.bert.encoder.layer.5.attention.self.value 10 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
33 nncf_module.bert.encoder.layer.5.attention.self.key 10 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
34 nncf_module.bert.encoder.layer.5.output.dense 11 (1024, 4096) (1024, 2107) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertOutput[output]/NNCFLinear[dense]/linear_0
35 nncf_module.bert.encoder.layer.5.intermediate.dense 11 (4096, 1024) (2107, 1024) (4096,) (2107,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
36 nncf_module.bert.encoder.layer.6.attention.self.query 12 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
37 nncf_module.bert.encoder.layer.6.attention.self.key 12 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
38 nncf_module.bert.encoder.layer.6.attention.self.value 12 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 rows See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
39 nncf_module.bert.encoder.layer.6.attention.output.dense 12 (1024, 1024) (1024, 1024) (1024,) (1024,) group of 64 cols See pkl [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
40 nncf_module.bert.encoder.layer.6.output.dense 13 (1024, 4096) (1024, 2368) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertOutput[output]/NNCFLinear[dense]/linear_0
41 nncf_module.bert.encoder.layer.6.intermediate.dense 13 (4096, 1024) (2368, 1024) (4096,) (2368,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
42 nncf_module.bert.encoder.layer.7.attention.self.query 14 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
43 nncf_module.bert.encoder.layer.7.attention.self.key 14 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
44 nncf_module.bert.encoder.layer.7.attention.output.dense 14 (1024, 1024) (1024, 128) (1024,) (1024,) group of 64 cols See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
45 nncf_module.bert.encoder.layer.7.attention.self.value 14 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
46 nncf_module.bert.encoder.layer.7.intermediate.dense 15 (4096, 1024) (2395, 1024) (4096,) (2395,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
47 nncf_module.bert.encoder.layer.7.output.dense 15 (1024, 4096) (1024, 2395) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertOutput[output]/NNCFLinear[dense]/linear_0
48 nncf_module.bert.encoder.layer.8.attention.self.value 16 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
49 nncf_module.bert.encoder.layer.8.attention.output.dense 16 (1024, 1024) (1024, 128) (1024,) (1024,) group of 64 cols See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
50 nncf_module.bert.encoder.layer.8.attention.self.query 16 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
51 nncf_module.bert.encoder.layer.8.attention.self.key 16 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [1, 6] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
52 nncf_module.bert.encoder.layer.8.intermediate.dense 17 (4096, 1024) (2352, 1024) (4096,) (2352,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
53 nncf_module.bert.encoder.layer.8.output.dense 17 (1024, 4096) (1024, 2352) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertOutput[output]/NNCFLinear[dense]/linear_0
54 nncf_module.bert.encoder.layer.9.attention.self.query 18 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
55 nncf_module.bert.encoder.layer.9.attention.self.key 18 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
56 nncf_module.bert.encoder.layer.9.attention.output.dense 18 (1024, 1024) (1024, 64) (1024,) (1024,) group of 64 cols See pkl [12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
57 nncf_module.bert.encoder.layer.9.attention.self.value 18 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
58 nncf_module.bert.encoder.layer.9.output.dense 19 (1024, 4096) (1024, 2345) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertOutput[output]/NNCFLinear[dense]/linear_0
59 nncf_module.bert.encoder.layer.9.intermediate.dense 19 (4096, 1024) (2345, 1024) (4096,) (2345,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
60 nncf_module.bert.encoder.layer.10.attention.self.query 20 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [0] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
61 nncf_module.bert.encoder.layer.10.attention.self.key 20 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [0] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
62 nncf_module.bert.encoder.layer.10.attention.output.dense 20 (1024, 1024) (1024, 64) (1024,) (1024,) group of 64 cols See pkl [0] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
63 nncf_module.bert.encoder.layer.10.attention.self.value 20 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [0] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
64 nncf_module.bert.encoder.layer.10.intermediate.dense 21 (4096, 1024) (2261, 1024) (4096,) (2261,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
65 nncf_module.bert.encoder.layer.10.output.dense 21 (1024, 4096) (1024, 2261) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertOutput[output]/NNCFLinear[dense]/linear_0
66 nncf_module.bert.encoder.layer.11.attention.output.dense 22 (1024, 1024) (1024, 256) (1024,) (1024,) group of 64 cols See pkl [1, 4, 9, 13] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
67 nncf_module.bert.encoder.layer.11.attention.self.key 22 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [1, 4, 9, 13] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
68 nncf_module.bert.encoder.layer.11.attention.self.value 22 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [1, 4, 9, 13] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
69 nncf_module.bert.encoder.layer.11.attention.self.query 22 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [1, 4, 9, 13] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
70 nncf_module.bert.encoder.layer.11.intermediate.dense 23 (4096, 1024) (1950, 1024) (4096,) (1950,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
71 nncf_module.bert.encoder.layer.11.output.dense 23 (1024, 4096) (1024, 1950) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertOutput[output]/NNCFLinear[dense]/linear_0
72 nncf_module.bert.encoder.layer.12.attention.self.query 24 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [4, 5, 7, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
73 nncf_module.bert.encoder.layer.12.attention.self.value 24 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [4, 5, 7, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
74 nncf_module.bert.encoder.layer.12.attention.self.key 24 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [4, 5, 7, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
75 nncf_module.bert.encoder.layer.12.attention.output.dense 24 (1024, 1024) (1024, 320) (1024,) (1024,) group of 64 cols See pkl [4, 5, 7, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
76 nncf_module.bert.encoder.layer.12.intermediate.dense 25 (4096, 1024) (1818, 1024) (4096,) (1818,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
77 nncf_module.bert.encoder.layer.12.output.dense 25 (1024, 4096) (1024, 1818) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertOutput[output]/NNCFLinear[dense]/linear_0
78 nncf_module.bert.encoder.layer.13.attention.self.query 26 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [4, 7, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
79 nncf_module.bert.encoder.layer.13.attention.output.dense 26 (1024, 1024) (1024, 256) (1024,) (1024,) group of 64 cols See pkl [4, 7, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
80 nncf_module.bert.encoder.layer.13.attention.self.key 26 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [4, 7, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
81 nncf_module.bert.encoder.layer.13.attention.self.value 26 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [4, 7, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
82 nncf_module.bert.encoder.layer.13.output.dense 27 (1024, 4096) (1024, 1585) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertOutput[output]/NNCFLinear[dense]/linear_0
83 nncf_module.bert.encoder.layer.13.intermediate.dense 27 (4096, 1024) (1585, 1024) (4096,) (1585,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
84 nncf_module.bert.encoder.layer.14.attention.output.dense 28 (1024, 1024) (1024, 320) (1024,) (1024,) group of 64 cols See pkl [2, 3, 4, 7, 8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
85 nncf_module.bert.encoder.layer.14.attention.self.value 28 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 3, 4, 7, 8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
86 nncf_module.bert.encoder.layer.14.attention.self.key 28 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 3, 4, 7, 8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
87 nncf_module.bert.encoder.layer.14.attention.self.query 28 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 3, 4, 7, 8] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
88 nncf_module.bert.encoder.layer.14.intermediate.dense 29 (4096, 1024) (1165, 1024) (4096,) (1165,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
89 nncf_module.bert.encoder.layer.14.output.dense 29 (1024, 4096) (1024, 1165) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertOutput[output]/NNCFLinear[dense]/linear_0
90 nncf_module.bert.encoder.layer.15.attention.output.dense 30 (1024, 1024) (1024, 320) (1024,) (1024,) group of 64 cols See pkl [2, 7, 8, 10, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
91 nncf_module.bert.encoder.layer.15.attention.self.query 30 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 7, 8, 10, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
92 nncf_module.bert.encoder.layer.15.attention.self.key 30 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 7, 8, 10, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
93 nncf_module.bert.encoder.layer.15.attention.self.value 30 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [2, 7, 8, 10, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
94 nncf_module.bert.encoder.layer.15.output.dense 31 (1024, 4096) (1024, 982) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertOutput[output]/NNCFLinear[dense]/linear_0
95 nncf_module.bert.encoder.layer.15.intermediate.dense 31 (4096, 1024) (982, 1024) (4096,) (982,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
96 nncf_module.bert.encoder.layer.16.attention.self.value 32 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [0, 8, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
97 nncf_module.bert.encoder.layer.16.attention.self.key 32 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [0, 8, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
98 nncf_module.bert.encoder.layer.16.attention.self.query 32 (1024, 1024) (320, 1024) (1024,) (320,) group of 64 rows See pkl [0, 8, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
99 nncf_module.bert.encoder.layer.16.attention.output.dense 32 (1024, 1024) (1024, 320) (1024,) (1024,) group of 64 cols See pkl [0, 8, 10, 13, 14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
100 nncf_module.bert.encoder.layer.16.intermediate.dense 33 (4096, 1024) (941, 1024) (4096,) (941,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
101 nncf_module.bert.encoder.layer.16.output.dense 33 (1024, 4096) (1024, 941) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertOutput[output]/NNCFLinear[dense]/linear_0
102 nncf_module.bert.encoder.layer.17.attention.self.key 34 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [3, 6, 7, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
103 nncf_module.bert.encoder.layer.17.attention.self.value 34 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [3, 6, 7, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
104 nncf_module.bert.encoder.layer.17.attention.output.dense 34 (1024, 1024) (1024, 256) (1024,) (1024,) group of 64 cols See pkl [3, 6, 7, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
105 nncf_module.bert.encoder.layer.17.attention.self.query 34 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [3, 6, 7, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
106 nncf_module.bert.encoder.layer.17.intermediate.dense 35 (4096, 1024) (838, 1024) (4096,) (838,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
107 nncf_module.bert.encoder.layer.17.output.dense 35 (1024, 4096) (1024, 838) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertOutput[output]/NNCFLinear[dense]/linear_0
108 nncf_module.bert.encoder.layer.18.attention.output.dense 36 (1024, 1024) (1024, 192) (1024,) (1024,) group of 64 cols See pkl [6, 8, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
109 nncf_module.bert.encoder.layer.18.attention.self.value 36 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [6, 8, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
110 nncf_module.bert.encoder.layer.18.attention.self.query 36 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [6, 8, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
111 nncf_module.bert.encoder.layer.18.attention.self.key 36 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [6, 8, 12] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
112 nncf_module.bert.encoder.layer.18.output.dense 37 (1024, 4096) (1024, 611) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertOutput[output]/NNCFLinear[dense]/linear_0
113 nncf_module.bert.encoder.layer.18.intermediate.dense 37 (4096, 1024) (611, 1024) (4096,) (611,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
114 nncf_module.bert.encoder.layer.19.attention.output.dense 38 (1024, 1024) (1024, 192) (1024,) (1024,) group of 64 cols See pkl [7, 9, 10] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
115 nncf_module.bert.encoder.layer.19.attention.self.key 38 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [7, 9, 10] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
116 nncf_module.bert.encoder.layer.19.attention.self.query 38 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [7, 9, 10] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
117 nncf_module.bert.encoder.layer.19.attention.self.value 38 (1024, 1024) (192, 1024) (1024,) (192,) group of 64 rows See pkl [7, 9, 10] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
118 nncf_module.bert.encoder.layer.19.intermediate.dense 39 (4096, 1024) (371, 1024) (4096,) (371,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
119 nncf_module.bert.encoder.layer.19.output.dense 39 (1024, 4096) (1024, 371) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertOutput[output]/NNCFLinear[dense]/linear_0
120 nncf_module.bert.encoder.layer.20.attention.self.key 40 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [5, 6, 9, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
121 nncf_module.bert.encoder.layer.20.attention.self.value 40 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [5, 6, 9, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
122 nncf_module.bert.encoder.layer.20.attention.output.dense 40 (1024, 1024) (1024, 256) (1024,) (1024,) group of 64 cols See pkl [5, 6, 9, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
123 nncf_module.bert.encoder.layer.20.attention.self.query 40 (1024, 1024) (256, 1024) (1024,) (256,) group of 64 rows See pkl [5, 6, 9, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
124 nncf_module.bert.encoder.layer.20.intermediate.dense 41 (4096, 1024) (175, 1024) (4096,) (175,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
125 nncf_module.bert.encoder.layer.20.output.dense 41 (1024, 4096) (1024, 175) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertOutput[output]/NNCFLinear[dense]/linear_0
126 nncf_module.bert.encoder.layer.21.attention.self.value 42 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [6, 7] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
127 nncf_module.bert.encoder.layer.21.attention.output.dense 42 (1024, 1024) (1024, 128) (1024,) (1024,) group of 64 cols See pkl [6, 7] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
128 nncf_module.bert.encoder.layer.21.attention.self.key 42 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [6, 7] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
129 nncf_module.bert.encoder.layer.21.attention.self.query 42 (1024, 1024) (128, 1024) (1024,) (128,) group of 64 rows See pkl [6, 7] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
130 nncf_module.bert.encoder.layer.21.output.dense 43 (1024, 4096) (1024, 128) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertOutput[output]/NNCFLinear[dense]/linear_0
131 nncf_module.bert.encoder.layer.21.intermediate.dense 43 (4096, 1024) (128, 1024) (4096,) (128,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
132 nncf_module.bert.encoder.layer.22.attention.self.value 44 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
133 nncf_module.bert.encoder.layer.22.attention.self.query 44 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
134 nncf_module.bert.encoder.layer.22.attention.output.dense 44 (1024, 1024) (1024, 64) (1024,) (1024,) group of 64 cols See pkl [14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
135 nncf_module.bert.encoder.layer.22.attention.self.key 44 (1024, 1024) (64, 1024) (1024,) (64,) group of 64 rows See pkl [14] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
136 nncf_module.bert.encoder.layer.22.intermediate.dense 45 (4096, 1024) (100, 1024) (4096,) (100,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
137 nncf_module.bert.encoder.layer.22.output.dense 45 (1024, 4096) (1024, 100) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertOutput[output]/NNCFLinear[dense]/linear_0
138 nncf_module.bert.encoder.layer.23.attention.output.dense 46 (1024, 1024) (1024, 704) (1024,) (1024,) group of 64 cols See pkl [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
139 nncf_module.bert.encoder.layer.23.attention.self.key 46 (1024, 1024) (704, 1024) (1024,) (704,) group of 64 rows See pkl [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
140 nncf_module.bert.encoder.layer.23.attention.self.value 46 (1024, 1024) (704, 1024) (1024,) (704,) group of 64 rows See pkl [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
141 nncf_module.bert.encoder.layer.23.attention.self.query 46 (1024, 1024) (704, 1024) (1024,) (704,) group of 64 rows See pkl [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
142 nncf_module.bert.encoder.layer.23.output.dense 47 (1024, 4096) (1024, 114) (1024,) (1024,) col See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertOutput[output]/NNCFLinear[dense]/linear_0
143 nncf_module.bert.encoder.layer.23.intermediate.dense 47 (4096, 1024) (114, 1024) (4096,) (114,) row See pkl BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0