| | pt_module_name | block_id | orig_w_shape | final_w_shape | orig_b_shape | final_b_shape | prune_by | id_to_keep | head_id_to_keep | nncf_graph_node | |----:|:---------------------------------------------------------|-----------:|:---------------|:----------------|:---------------|:----------------|:-----------------|:-------------|:-------------------------------------------------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------| | 0 | nncf_module.bert.encoder.layer.0.attention.self.query | 0 | (1024, 1024) | (448, 1024) | (1024,) | (448,) | group of 64 rows | See pkl | [1, 2, 6, 7, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 1 | nncf_module.bert.encoder.layer.0.attention.self.key | 0 | (1024, 1024) | (448, 1024) | (1024,) | (448,) | group of 64 rows | See pkl | [1, 2, 6, 7, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 2 | nncf_module.bert.encoder.layer.0.attention.self.value | 0 | (1024, 1024) | (448, 1024) | (1024,) | (448,) | group of 64 rows | See pkl | [1, 2, 6, 7, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 3 | nncf_module.bert.encoder.layer.0.attention.output.dense | 0 | (1024, 1024) | (1024, 448) | (1024,) | (1024,) | group of 64 cols | See pkl | [1, 2, 6, 7, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 4 | nncf_module.bert.encoder.layer.0.output.dense | 1 | (1024, 4096) | (1024, 915) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 5 | nncf_module.bert.encoder.layer.0.intermediate.dense | 1 | (4096, 1024) | (915, 1024) | (4096,) | (915,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 6 | nncf_module.bert.encoder.layer.1.attention.self.key | 2 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 7 | nncf_module.bert.encoder.layer.1.attention.self.query | 2 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 8 | nncf_module.bert.encoder.layer.1.attention.output.dense | 2 | (1024, 1024) | (1024, 64) | (1024,) | (1024,) | group of 64 cols | See pkl | [8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 9 | nncf_module.bert.encoder.layer.1.attention.self.value | 2 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 10 | nncf_module.bert.encoder.layer.1.intermediate.dense | 3 | (4096, 1024) | (829, 1024) | (4096,) | (829,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 11 | nncf_module.bert.encoder.layer.1.output.dense | 3 | (1024, 4096) | (1024, 829) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 12 | nncf_module.bert.encoder.layer.2.attention.output.dense | 4 | (1024, 1024) | (1024, 128) | (1024,) | (1024,) | group of 64 cols | See pkl | [3, 5] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 13 | nncf_module.bert.encoder.layer.2.attention.self.value | 4 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [3, 5] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 14 | nncf_module.bert.encoder.layer.2.attention.self.query | 4 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [3, 5] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 15 | nncf_module.bert.encoder.layer.2.attention.self.key | 4 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [3, 5] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 16 | nncf_module.bert.encoder.layer.2.output.dense | 5 | (1024, 4096) | (1024, 1181) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 17 | nncf_module.bert.encoder.layer.2.intermediate.dense | 5 | (4096, 1024) | (1181, 1024) | (4096,) | (1181,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 18 | nncf_module.bert.encoder.layer.3.attention.self.value | 6 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [4, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 19 | nncf_module.bert.encoder.layer.3.attention.output.dense | 6 | (1024, 1024) | (1024, 128) | (1024,) | (1024,) | group of 64 cols | See pkl | [4, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 20 | nncf_module.bert.encoder.layer.3.attention.self.query | 6 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [4, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 21 | nncf_module.bert.encoder.layer.3.attention.self.key | 6 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [4, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 22 | nncf_module.bert.encoder.layer.3.output.dense | 7 | (1024, 4096) | (1024, 1526) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 23 | nncf_module.bert.encoder.layer.3.intermediate.dense | 7 | (4096, 1024) | (1526, 1024) | (4096,) | (1526,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 24 | nncf_module.bert.encoder.layer.4.attention.self.key | 8 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 25 | nncf_module.bert.encoder.layer.4.attention.self.value | 8 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 26 | nncf_module.bert.encoder.layer.4.attention.output.dense | 8 | (1024, 1024) | (1024, 64) | (1024,) | (1024,) | group of 64 cols | See pkl | [15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 27 | nncf_module.bert.encoder.layer.4.attention.self.query | 8 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 28 | nncf_module.bert.encoder.layer.4.output.dense | 9 | (1024, 4096) | (1024, 1749) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 29 | nncf_module.bert.encoder.layer.4.intermediate.dense | 9 | (4096, 1024) | (1749, 1024) | (4096,) | (1749,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 30 | nncf_module.bert.encoder.layer.5.attention.self.query | 10 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 31 | nncf_module.bert.encoder.layer.5.attention.self.value | 10 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 32 | nncf_module.bert.encoder.layer.5.attention.self.key | 10 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 33 | nncf_module.bert.encoder.layer.5.attention.output.dense | 10 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 cols | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 34 | nncf_module.bert.encoder.layer.5.intermediate.dense | 11 | (4096, 1024) | (2107, 1024) | (4096,) | (2107,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 35 | nncf_module.bert.encoder.layer.5.output.dense | 11 | (1024, 4096) | (1024, 2107) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 36 | nncf_module.bert.encoder.layer.6.attention.output.dense | 12 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 cols | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 37 | nncf_module.bert.encoder.layer.6.attention.self.key | 12 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 38 | nncf_module.bert.encoder.layer.6.attention.self.query | 12 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 39 | nncf_module.bert.encoder.layer.6.attention.self.value | 12 | (1024, 1024) | (1024, 1024) | (1024,) | (1024,) | group of 64 rows | See pkl | [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 40 | nncf_module.bert.encoder.layer.6.intermediate.dense | 13 | (4096, 1024) | (2368, 1024) | (4096,) | (2368,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 41 | nncf_module.bert.encoder.layer.6.output.dense | 13 | (1024, 4096) | (1024, 2368) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 42 | nncf_module.bert.encoder.layer.7.attention.output.dense | 14 | (1024, 1024) | (1024, 128) | (1024,) | (1024,) | group of 64 cols | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 43 | nncf_module.bert.encoder.layer.7.attention.self.value | 14 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 44 | nncf_module.bert.encoder.layer.7.attention.self.query | 14 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 45 | nncf_module.bert.encoder.layer.7.attention.self.key | 14 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 46 | nncf_module.bert.encoder.layer.7.output.dense | 15 | (1024, 4096) | (1024, 2395) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 47 | nncf_module.bert.encoder.layer.7.intermediate.dense | 15 | (4096, 1024) | (2395, 1024) | (4096,) | (2395,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 48 | nncf_module.bert.encoder.layer.8.attention.self.value | 16 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 49 | nncf_module.bert.encoder.layer.8.attention.self.query | 16 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 50 | nncf_module.bert.encoder.layer.8.attention.self.key | 16 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 51 | nncf_module.bert.encoder.layer.8.attention.output.dense | 16 | (1024, 1024) | (1024, 128) | (1024,) | (1024,) | group of 64 cols | See pkl | [1, 6] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 52 | nncf_module.bert.encoder.layer.8.output.dense | 17 | (1024, 4096) | (1024, 2352) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 53 | nncf_module.bert.encoder.layer.8.intermediate.dense | 17 | (4096, 1024) | (2352, 1024) | (4096,) | (2352,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 54 | nncf_module.bert.encoder.layer.9.attention.self.value | 18 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 55 | nncf_module.bert.encoder.layer.9.attention.self.key | 18 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 56 | nncf_module.bert.encoder.layer.9.attention.output.dense | 18 | (1024, 1024) | (1024, 64) | (1024,) | (1024,) | group of 64 cols | See pkl | [12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 57 | nncf_module.bert.encoder.layer.9.attention.self.query | 18 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 58 | nncf_module.bert.encoder.layer.9.output.dense | 19 | (1024, 4096) | (1024, 2345) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 59 | nncf_module.bert.encoder.layer.9.intermediate.dense | 19 | (4096, 1024) | (2345, 1024) | (4096,) | (2345,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 60 | nncf_module.bert.encoder.layer.10.attention.output.dense | 20 | (1024, 1024) | (1024, 64) | (1024,) | (1024,) | group of 64 cols | See pkl | [0] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 61 | nncf_module.bert.encoder.layer.10.attention.self.query | 20 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [0] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 62 | nncf_module.bert.encoder.layer.10.attention.self.value | 20 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [0] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 63 | nncf_module.bert.encoder.layer.10.attention.self.key | 20 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [0] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 64 | nncf_module.bert.encoder.layer.10.intermediate.dense | 21 | (4096, 1024) | (2261, 1024) | (4096,) | (2261,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 65 | nncf_module.bert.encoder.layer.10.output.dense | 21 | (1024, 4096) | (1024, 2261) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 66 | nncf_module.bert.encoder.layer.11.attention.self.query | 22 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [1, 4, 9, 13] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 67 | nncf_module.bert.encoder.layer.11.attention.output.dense | 22 | (1024, 1024) | (1024, 256) | (1024,) | (1024,) | group of 64 cols | See pkl | [1, 4, 9, 13] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 68 | nncf_module.bert.encoder.layer.11.attention.self.key | 22 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [1, 4, 9, 13] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 69 | nncf_module.bert.encoder.layer.11.attention.self.value | 22 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [1, 4, 9, 13] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 70 | nncf_module.bert.encoder.layer.11.output.dense | 23 | (1024, 4096) | (1024, 1950) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 71 | nncf_module.bert.encoder.layer.11.intermediate.dense | 23 | (4096, 1024) | (1950, 1024) | (4096,) | (1950,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 72 | nncf_module.bert.encoder.layer.12.attention.self.value | 24 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [4, 5, 7, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 73 | nncf_module.bert.encoder.layer.12.attention.output.dense | 24 | (1024, 1024) | (1024, 320) | (1024,) | (1024,) | group of 64 cols | See pkl | [4, 5, 7, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 74 | nncf_module.bert.encoder.layer.12.attention.self.key | 24 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [4, 5, 7, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 75 | nncf_module.bert.encoder.layer.12.attention.self.query | 24 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [4, 5, 7, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 76 | nncf_module.bert.encoder.layer.12.output.dense | 25 | (1024, 4096) | (1024, 1818) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 77 | nncf_module.bert.encoder.layer.12.intermediate.dense | 25 | (4096, 1024) | (1818, 1024) | (4096,) | (1818,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 78 | nncf_module.bert.encoder.layer.13.attention.output.dense | 26 | (1024, 1024) | (1024, 256) | (1024,) | (1024,) | group of 64 cols | See pkl | [4, 7, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 79 | nncf_module.bert.encoder.layer.13.attention.self.value | 26 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [4, 7, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 80 | nncf_module.bert.encoder.layer.13.attention.self.query | 26 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [4, 7, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 81 | nncf_module.bert.encoder.layer.13.attention.self.key | 26 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [4, 7, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 82 | nncf_module.bert.encoder.layer.13.intermediate.dense | 27 | (4096, 1024) | (1585, 1024) | (4096,) | (1585,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 83 | nncf_module.bert.encoder.layer.13.output.dense | 27 | (1024, 4096) | (1024, 1585) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 84 | nncf_module.bert.encoder.layer.14.attention.self.query | 28 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 3, 4, 7, 8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 85 | nncf_module.bert.encoder.layer.14.attention.output.dense | 28 | (1024, 1024) | (1024, 320) | (1024,) | (1024,) | group of 64 cols | See pkl | [2, 3, 4, 7, 8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 86 | nncf_module.bert.encoder.layer.14.attention.self.key | 28 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 3, 4, 7, 8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 87 | nncf_module.bert.encoder.layer.14.attention.self.value | 28 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 3, 4, 7, 8] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 88 | nncf_module.bert.encoder.layer.14.intermediate.dense | 29 | (4096, 1024) | (1165, 1024) | (4096,) | (1165,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 89 | nncf_module.bert.encoder.layer.14.output.dense | 29 | (1024, 4096) | (1024, 1165) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 90 | nncf_module.bert.encoder.layer.15.attention.self.query | 30 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 7, 8, 10, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 91 | nncf_module.bert.encoder.layer.15.attention.self.key | 30 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 7, 8, 10, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 92 | nncf_module.bert.encoder.layer.15.attention.self.value | 30 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [2, 7, 8, 10, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 93 | nncf_module.bert.encoder.layer.15.attention.output.dense | 30 | (1024, 1024) | (1024, 320) | (1024,) | (1024,) | group of 64 cols | See pkl | [2, 7, 8, 10, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 94 | nncf_module.bert.encoder.layer.15.intermediate.dense | 31 | (4096, 1024) | (982, 1024) | (4096,) | (982,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 95 | nncf_module.bert.encoder.layer.15.output.dense | 31 | (1024, 4096) | (1024, 982) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 96 | nncf_module.bert.encoder.layer.16.attention.self.query | 32 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [0, 8, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 97 | nncf_module.bert.encoder.layer.16.attention.self.key | 32 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [0, 8, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 98 | nncf_module.bert.encoder.layer.16.attention.output.dense | 32 | (1024, 1024) | (1024, 320) | (1024,) | (1024,) | group of 64 cols | See pkl | [0, 8, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 99 | nncf_module.bert.encoder.layer.16.attention.self.value | 32 | (1024, 1024) | (320, 1024) | (1024,) | (320,) | group of 64 rows | See pkl | [0, 8, 10, 13, 14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 100 | nncf_module.bert.encoder.layer.16.output.dense | 33 | (1024, 4096) | (1024, 941) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 101 | nncf_module.bert.encoder.layer.16.intermediate.dense | 33 | (4096, 1024) | (941, 1024) | (4096,) | (941,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 102 | nncf_module.bert.encoder.layer.17.attention.self.query | 34 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [3, 6, 7, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 103 | nncf_module.bert.encoder.layer.17.attention.self.value | 34 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [3, 6, 7, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 104 | nncf_module.bert.encoder.layer.17.attention.self.key | 34 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [3, 6, 7, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 105 | nncf_module.bert.encoder.layer.17.attention.output.dense | 34 | (1024, 1024) | (1024, 256) | (1024,) | (1024,) | group of 64 cols | See pkl | [3, 6, 7, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 106 | nncf_module.bert.encoder.layer.17.output.dense | 35 | (1024, 4096) | (1024, 838) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 107 | nncf_module.bert.encoder.layer.17.intermediate.dense | 35 | (4096, 1024) | (838, 1024) | (4096,) | (838,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 108 | nncf_module.bert.encoder.layer.18.attention.self.value | 36 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [6, 8, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 109 | nncf_module.bert.encoder.layer.18.attention.self.query | 36 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [6, 8, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 110 | nncf_module.bert.encoder.layer.18.attention.self.key | 36 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [6, 8, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 111 | nncf_module.bert.encoder.layer.18.attention.output.dense | 36 | (1024, 1024) | (1024, 192) | (1024,) | (1024,) | group of 64 cols | See pkl | [6, 8, 12] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 112 | nncf_module.bert.encoder.layer.18.output.dense | 37 | (1024, 4096) | (1024, 611) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 113 | nncf_module.bert.encoder.layer.18.intermediate.dense | 37 | (4096, 1024) | (611, 1024) | (4096,) | (611,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 114 | nncf_module.bert.encoder.layer.19.attention.output.dense | 38 | (1024, 1024) | (1024, 192) | (1024,) | (1024,) | group of 64 cols | See pkl | [7, 9, 10] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 115 | nncf_module.bert.encoder.layer.19.attention.self.key | 38 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [7, 9, 10] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 116 | nncf_module.bert.encoder.layer.19.attention.self.value | 38 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [7, 9, 10] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 117 | nncf_module.bert.encoder.layer.19.attention.self.query | 38 | (1024, 1024) | (192, 1024) | (1024,) | (192,) | group of 64 rows | See pkl | [7, 9, 10] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 118 | nncf_module.bert.encoder.layer.19.output.dense | 39 | (1024, 4096) | (1024, 371) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 119 | nncf_module.bert.encoder.layer.19.intermediate.dense | 39 | (4096, 1024) | (371, 1024) | (4096,) | (371,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 120 | nncf_module.bert.encoder.layer.20.attention.self.key | 40 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [5, 6, 9, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 121 | nncf_module.bert.encoder.layer.20.attention.self.value | 40 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [5, 6, 9, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 122 | nncf_module.bert.encoder.layer.20.attention.output.dense | 40 | (1024, 1024) | (1024, 256) | (1024,) | (1024,) | group of 64 cols | See pkl | [5, 6, 9, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 123 | nncf_module.bert.encoder.layer.20.attention.self.query | 40 | (1024, 1024) | (256, 1024) | (1024,) | (256,) | group of 64 rows | See pkl | [5, 6, 9, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 124 | nncf_module.bert.encoder.layer.20.intermediate.dense | 41 | (4096, 1024) | (175, 1024) | (4096,) | (175,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 125 | nncf_module.bert.encoder.layer.20.output.dense | 41 | (1024, 4096) | (1024, 175) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 126 | nncf_module.bert.encoder.layer.21.attention.output.dense | 42 | (1024, 1024) | (1024, 128) | (1024,) | (1024,) | group of 64 cols | See pkl | [6, 7] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 127 | nncf_module.bert.encoder.layer.21.attention.self.query | 42 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [6, 7] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 128 | nncf_module.bert.encoder.layer.21.attention.self.value | 42 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [6, 7] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 129 | nncf_module.bert.encoder.layer.21.attention.self.key | 42 | (1024, 1024) | (128, 1024) | (1024,) | (128,) | group of 64 rows | See pkl | [6, 7] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 130 | nncf_module.bert.encoder.layer.21.intermediate.dense | 43 | (4096, 1024) | (128, 1024) | (4096,) | (128,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 131 | nncf_module.bert.encoder.layer.21.output.dense | 43 | (1024, 4096) | (1024, 128) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 132 | nncf_module.bert.encoder.layer.22.attention.output.dense | 44 | (1024, 1024) | (1024, 64) | (1024,) | (1024,) | group of 64 cols | See pkl | [14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 133 | nncf_module.bert.encoder.layer.22.attention.self.value | 44 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 134 | nncf_module.bert.encoder.layer.22.attention.self.key | 44 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 135 | nncf_module.bert.encoder.layer.22.attention.self.query | 44 | (1024, 1024) | (64, 1024) | (1024,) | (64,) | group of 64 rows | See pkl | [14] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 136 | nncf_module.bert.encoder.layer.22.intermediate.dense | 45 | (4096, 1024) | (100, 1024) | (4096,) | (100,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 137 | nncf_module.bert.encoder.layer.22.output.dense | 45 | (1024, 4096) | (1024, 100) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertOutput[output]/NNCFLinear[dense]/linear_0 | | 138 | nncf_module.bert.encoder.layer.23.attention.self.query | 46 | (1024, 1024) | (704, 1024) | (1024,) | (704,) | group of 64 rows | See pkl | [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 | | 139 | nncf_module.bert.encoder.layer.23.attention.self.key | 46 | (1024, 1024) | (704, 1024) | (1024,) | (704,) | group of 64 rows | See pkl | [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 | | 140 | nncf_module.bert.encoder.layer.23.attention.output.dense | 46 | (1024, 1024) | (1024, 704) | (1024,) | (1024,) | group of 64 cols | See pkl | [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 | | 141 | nncf_module.bert.encoder.layer.23.attention.self.value | 46 | (1024, 1024) | (704, 1024) | (1024,) | (704,) | group of 64 rows | See pkl | [0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 | | 142 | nncf_module.bert.encoder.layer.23.intermediate.dense | 47 | (4096, 1024) | (114, 1024) | (4096,) | (114,) | row | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 | | 143 | nncf_module.bert.encoder.layer.23.output.dense | 47 | (1024, 4096) | (1024, 114) | (1024,) | (1024,) | col | See pkl | | BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertOutput[output]/NNCFLinear[dense]/linear_0 |