Vui Seng Chua
Update collateral
68c7f51
pt_module_name,block_id,orig_w_shape,final_w_shape,orig_b_shape,final_b_shape,prune_by,id_to_keep,head_id_to_keep,nncf_graph_node
nncf_module.bert.encoder.layer.0.attention.self.key,0,"(1024, 1024)","(448, 1024)","(1024,)","(448,)",group of 64 rows,See pkl,"[1, 2, 6, 7, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.0.attention.self.value,0,"(1024, 1024)","(448, 1024)","(1024,)","(448,)",group of 64 rows,See pkl,"[1, 2, 6, 7, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.0.attention.self.query,0,"(1024, 1024)","(448, 1024)","(1024,)","(448,)",group of 64 rows,See pkl,"[1, 2, 6, 7, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.0.attention.output.dense,0,"(1024, 1024)","(1024, 448)","(1024,)","(1024,)",group of 64 cols,See pkl,"[1, 2, 6, 7, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.0.intermediate.dense,1,"(4096, 1024)","(915, 1024)","(4096,)","(915,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.0.output.dense,1,"(1024, 4096)","(1024, 915)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.1.attention.self.query,2,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[8],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.1.attention.self.value,2,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[8],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.1.attention.self.key,2,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[8],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.1.attention.output.dense,2,"(1024, 1024)","(1024, 64)","(1024,)","(1024,)",group of 64 cols,See pkl,[8],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.1.output.dense,3,"(1024, 4096)","(1024, 829)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.1.intermediate.dense,3,"(4096, 1024)","(829, 1024)","(4096,)","(829,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.2.attention.output.dense,4,"(1024, 1024)","(1024, 128)","(1024,)","(1024,)",group of 64 cols,See pkl,"[3, 5]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.2.attention.self.value,4,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[3, 5]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.2.attention.self.key,4,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[3, 5]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.2.attention.self.query,4,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[3, 5]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.2.output.dense,5,"(1024, 4096)","(1024, 1181)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.2.intermediate.dense,5,"(4096, 1024)","(1181, 1024)","(4096,)","(1181,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.3.attention.self.value,6,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[4, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.3.attention.self.key,6,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[4, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.3.attention.self.query,6,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[4, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.3.attention.output.dense,6,"(1024, 1024)","(1024, 128)","(1024,)","(1024,)",group of 64 cols,See pkl,"[4, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.3.output.dense,7,"(1024, 4096)","(1024, 1526)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.3.intermediate.dense,7,"(4096, 1024)","(1526, 1024)","(4096,)","(1526,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.4.attention.self.key,8,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[15],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.4.attention.self.value,8,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[15],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.4.attention.self.query,8,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[15],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.4.attention.output.dense,8,"(1024, 1024)","(1024, 64)","(1024,)","(1024,)",group of 64 cols,See pkl,[15],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.4.output.dense,9,"(1024, 4096)","(1024, 1749)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.4.intermediate.dense,9,"(4096, 1024)","(1749, 1024)","(4096,)","(1749,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.5.attention.self.query,10,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.5.attention.output.dense,10,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 cols,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.5.attention.self.value,10,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.5.attention.self.key,10,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.5.output.dense,11,"(1024, 4096)","(1024, 2107)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.5.intermediate.dense,11,"(4096, 1024)","(2107, 1024)","(4096,)","(2107,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.6.attention.self.query,12,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.6.attention.self.key,12,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.6.attention.self.value,12,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 rows,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.6.attention.output.dense,12,"(1024, 1024)","(1024, 1024)","(1024,)","(1024,)",group of 64 cols,See pkl,"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.6.output.dense,13,"(1024, 4096)","(1024, 2368)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.6.intermediate.dense,13,"(4096, 1024)","(2368, 1024)","(4096,)","(2368,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.7.attention.self.query,14,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.7.attention.self.key,14,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.7.attention.output.dense,14,"(1024, 1024)","(1024, 128)","(1024,)","(1024,)",group of 64 cols,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.7.attention.self.value,14,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.7.intermediate.dense,15,"(4096, 1024)","(2395, 1024)","(4096,)","(2395,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.7.output.dense,15,"(1024, 4096)","(1024, 2395)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.8.attention.self.value,16,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.8.attention.output.dense,16,"(1024, 1024)","(1024, 128)","(1024,)","(1024,)",group of 64 cols,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.8.attention.self.query,16,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.8.attention.self.key,16,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[1, 6]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.8.intermediate.dense,17,"(4096, 1024)","(2352, 1024)","(4096,)","(2352,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.8.output.dense,17,"(1024, 4096)","(1024, 2352)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.9.attention.self.query,18,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[12],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.9.attention.self.key,18,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[12],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.9.attention.output.dense,18,"(1024, 1024)","(1024, 64)","(1024,)","(1024,)",group of 64 cols,See pkl,[12],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.9.attention.self.value,18,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[12],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.9.output.dense,19,"(1024, 4096)","(1024, 2345)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.9.intermediate.dense,19,"(4096, 1024)","(2345, 1024)","(4096,)","(2345,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.10.attention.self.query,20,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[0],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.10.attention.self.key,20,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[0],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.10.attention.output.dense,20,"(1024, 1024)","(1024, 64)","(1024,)","(1024,)",group of 64 cols,See pkl,[0],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.10.attention.self.value,20,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[0],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.10.intermediate.dense,21,"(4096, 1024)","(2261, 1024)","(4096,)","(2261,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.10.output.dense,21,"(1024, 4096)","(1024, 2261)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.11.attention.output.dense,22,"(1024, 1024)","(1024, 256)","(1024,)","(1024,)",group of 64 cols,See pkl,"[1, 4, 9, 13]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.11.attention.self.key,22,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[1, 4, 9, 13]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.11.attention.self.value,22,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[1, 4, 9, 13]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.11.attention.self.query,22,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[1, 4, 9, 13]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.11.intermediate.dense,23,"(4096, 1024)","(1950, 1024)","(4096,)","(1950,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.11.output.dense,23,"(1024, 4096)","(1024, 1950)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.12.attention.self.query,24,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[4, 5, 7, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.12.attention.self.value,24,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[4, 5, 7, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.12.attention.self.key,24,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[4, 5, 7, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.12.attention.output.dense,24,"(1024, 1024)","(1024, 320)","(1024,)","(1024,)",group of 64 cols,See pkl,"[4, 5, 7, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.12.intermediate.dense,25,"(4096, 1024)","(1818, 1024)","(4096,)","(1818,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.12.output.dense,25,"(1024, 4096)","(1024, 1818)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.13.attention.self.query,26,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[4, 7, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.13.attention.output.dense,26,"(1024, 1024)","(1024, 256)","(1024,)","(1024,)",group of 64 cols,See pkl,"[4, 7, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.13.attention.self.key,26,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[4, 7, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.13.attention.self.value,26,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[4, 7, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.13.output.dense,27,"(1024, 4096)","(1024, 1585)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.13.intermediate.dense,27,"(4096, 1024)","(1585, 1024)","(4096,)","(1585,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.14.attention.output.dense,28,"(1024, 1024)","(1024, 320)","(1024,)","(1024,)",group of 64 cols,See pkl,"[2, 3, 4, 7, 8]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.14.attention.self.value,28,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 3, 4, 7, 8]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.14.attention.self.key,28,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 3, 4, 7, 8]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.14.attention.self.query,28,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 3, 4, 7, 8]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.14.intermediate.dense,29,"(4096, 1024)","(1165, 1024)","(4096,)","(1165,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.14.output.dense,29,"(1024, 4096)","(1024, 1165)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.15.attention.output.dense,30,"(1024, 1024)","(1024, 320)","(1024,)","(1024,)",group of 64 cols,See pkl,"[2, 7, 8, 10, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.15.attention.self.query,30,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 7, 8, 10, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.15.attention.self.key,30,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 7, 8, 10, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.15.attention.self.value,30,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[2, 7, 8, 10, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.15.output.dense,31,"(1024, 4096)","(1024, 982)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.15.intermediate.dense,31,"(4096, 1024)","(982, 1024)","(4096,)","(982,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.16.attention.self.value,32,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[0, 8, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.16.attention.self.key,32,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[0, 8, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.16.attention.self.query,32,"(1024, 1024)","(320, 1024)","(1024,)","(320,)",group of 64 rows,See pkl,"[0, 8, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.16.attention.output.dense,32,"(1024, 1024)","(1024, 320)","(1024,)","(1024,)",group of 64 cols,See pkl,"[0, 8, 10, 13, 14]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.16.intermediate.dense,33,"(4096, 1024)","(941, 1024)","(4096,)","(941,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.16.output.dense,33,"(1024, 4096)","(1024, 941)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.17.attention.self.key,34,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[3, 6, 7, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.17.attention.self.value,34,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[3, 6, 7, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.17.attention.output.dense,34,"(1024, 1024)","(1024, 256)","(1024,)","(1024,)",group of 64 cols,See pkl,"[3, 6, 7, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.17.attention.self.query,34,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[3, 6, 7, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.17.intermediate.dense,35,"(4096, 1024)","(838, 1024)","(4096,)","(838,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.17.output.dense,35,"(1024, 4096)","(1024, 838)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.18.attention.output.dense,36,"(1024, 1024)","(1024, 192)","(1024,)","(1024,)",group of 64 cols,See pkl,"[6, 8, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.18.attention.self.value,36,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[6, 8, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.18.attention.self.query,36,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[6, 8, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.18.attention.self.key,36,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[6, 8, 12]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.18.output.dense,37,"(1024, 4096)","(1024, 611)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.18.intermediate.dense,37,"(4096, 1024)","(611, 1024)","(4096,)","(611,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.19.attention.output.dense,38,"(1024, 1024)","(1024, 192)","(1024,)","(1024,)",group of 64 cols,See pkl,"[7, 9, 10]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.19.attention.self.key,38,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[7, 9, 10]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.19.attention.self.query,38,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[7, 9, 10]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.19.attention.self.value,38,"(1024, 1024)","(192, 1024)","(1024,)","(192,)",group of 64 rows,See pkl,"[7, 9, 10]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.19.intermediate.dense,39,"(4096, 1024)","(371, 1024)","(4096,)","(371,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.19.output.dense,39,"(1024, 4096)","(1024, 371)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.20.attention.self.key,40,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[5, 6, 9, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.20.attention.self.value,40,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[5, 6, 9, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.20.attention.output.dense,40,"(1024, 1024)","(1024, 256)","(1024,)","(1024,)",group of 64 cols,See pkl,"[5, 6, 9, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.20.attention.self.query,40,"(1024, 1024)","(256, 1024)","(1024,)","(256,)",group of 64 rows,See pkl,"[5, 6, 9, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.20.intermediate.dense,41,"(4096, 1024)","(175, 1024)","(4096,)","(175,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.20.output.dense,41,"(1024, 4096)","(1024, 175)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.21.attention.self.value,42,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[6, 7]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.21.attention.output.dense,42,"(1024, 1024)","(1024, 128)","(1024,)","(1024,)",group of 64 cols,See pkl,"[6, 7]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.21.attention.self.key,42,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[6, 7]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.21.attention.self.query,42,"(1024, 1024)","(128, 1024)","(1024,)","(128,)",group of 64 rows,See pkl,"[6, 7]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.21.output.dense,43,"(1024, 4096)","(1024, 128)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.21.intermediate.dense,43,"(4096, 1024)","(128, 1024)","(4096,)","(128,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.22.attention.self.value,44,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[14],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.22.attention.self.query,44,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[14],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.22.attention.output.dense,44,"(1024, 1024)","(1024, 64)","(1024,)","(1024,)",group of 64 cols,See pkl,[14],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.22.attention.self.key,44,"(1024, 1024)","(64, 1024)","(1024,)","(64,)",group of 64 rows,See pkl,[14],BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.22.intermediate.dense,45,"(4096, 1024)","(100, 1024)","(4096,)","(100,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.22.output.dense,45,"(1024, 4096)","(1024, 100)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.23.attention.output.dense,46,"(1024, 1024)","(1024, 704)","(1024,)","(1024,)",group of 64 cols,See pkl,"[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.23.attention.self.key,46,"(1024, 1024)","(704, 1024)","(1024,)","(704,)",group of 64 rows,See pkl,"[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0
nncf_module.bert.encoder.layer.23.attention.self.value,46,"(1024, 1024)","(704, 1024)","(1024,)","(704,)",group of 64 rows,See pkl,"[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0
nncf_module.bert.encoder.layer.23.attention.self.query,46,"(1024, 1024)","(704, 1024)","(1024,)","(704,)",group of 64 rows,See pkl,"[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15]",BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0
nncf_module.bert.encoder.layer.23.output.dense,47,"(1024, 4096)","(1024, 114)","(1024,)","(1024,)",col,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertOutput[output]/NNCFLinear[dense]/linear_0
nncf_module.bert.encoder.layer.23.intermediate.dense,47,"(4096, 1024)","(114, 1024)","(4096,)","(114,)",row,See pkl,,BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0