0 |
nncf_module.bert.encoder.layer.0.attention.self.key |
0 |
(1024, 1024) |
(448, 1024) |
(1024,) |
(448,) |
group of 64 rows |
See pkl |
[1, 2, 6, 7, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
1 |
nncf_module.bert.encoder.layer.0.attention.self.value |
0 |
(1024, 1024) |
(448, 1024) |
(1024,) |
(448,) |
group of 64 rows |
See pkl |
[1, 2, 6, 7, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
2 |
nncf_module.bert.encoder.layer.0.attention.self.query |
0 |
(1024, 1024) |
(448, 1024) |
(1024,) |
(448,) |
group of 64 rows |
See pkl |
[1, 2, 6, 7, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
3 |
nncf_module.bert.encoder.layer.0.attention.output.dense |
0 |
(1024, 1024) |
(1024, 448) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[1, 2, 6, 7, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
4 |
nncf_module.bert.encoder.layer.0.intermediate.dense |
1 |
(4096, 1024) |
(915, 1024) |
(4096,) |
(915,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
5 |
nncf_module.bert.encoder.layer.0.output.dense |
1 |
(1024, 4096) |
(1024, 915) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
6 |
nncf_module.bert.encoder.layer.1.attention.self.query |
2 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
7 |
nncf_module.bert.encoder.layer.1.attention.self.value |
2 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
8 |
nncf_module.bert.encoder.layer.1.attention.self.key |
2 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
9 |
nncf_module.bert.encoder.layer.1.attention.output.dense |
2 |
(1024, 1024) |
(1024, 64) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
10 |
nncf_module.bert.encoder.layer.1.output.dense |
3 |
(1024, 4096) |
(1024, 829) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
11 |
nncf_module.bert.encoder.layer.1.intermediate.dense |
3 |
(4096, 1024) |
(829, 1024) |
(4096,) |
(829,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
12 |
nncf_module.bert.encoder.layer.2.attention.output.dense |
4 |
(1024, 1024) |
(1024, 128) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[3, 5] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
13 |
nncf_module.bert.encoder.layer.2.attention.self.value |
4 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[3, 5] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
14 |
nncf_module.bert.encoder.layer.2.attention.self.key |
4 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[3, 5] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
15 |
nncf_module.bert.encoder.layer.2.attention.self.query |
4 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[3, 5] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
16 |
nncf_module.bert.encoder.layer.2.output.dense |
5 |
(1024, 4096) |
(1024, 1181) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
17 |
nncf_module.bert.encoder.layer.2.intermediate.dense |
5 |
(4096, 1024) |
(1181, 1024) |
(4096,) |
(1181,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
18 |
nncf_module.bert.encoder.layer.3.attention.self.value |
6 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[4, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
19 |
nncf_module.bert.encoder.layer.3.attention.self.key |
6 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[4, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
20 |
nncf_module.bert.encoder.layer.3.attention.self.query |
6 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[4, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
21 |
nncf_module.bert.encoder.layer.3.attention.output.dense |
6 |
(1024, 1024) |
(1024, 128) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[4, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
22 |
nncf_module.bert.encoder.layer.3.output.dense |
7 |
(1024, 4096) |
(1024, 1526) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
23 |
nncf_module.bert.encoder.layer.3.intermediate.dense |
7 |
(4096, 1024) |
(1526, 1024) |
(4096,) |
(1526,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
24 |
nncf_module.bert.encoder.layer.4.attention.self.key |
8 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
25 |
nncf_module.bert.encoder.layer.4.attention.self.value |
8 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
26 |
nncf_module.bert.encoder.layer.4.attention.self.query |
8 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
27 |
nncf_module.bert.encoder.layer.4.attention.output.dense |
8 |
(1024, 1024) |
(1024, 64) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
28 |
nncf_module.bert.encoder.layer.4.output.dense |
9 |
(1024, 4096) |
(1024, 1749) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
29 |
nncf_module.bert.encoder.layer.4.intermediate.dense |
9 |
(4096, 1024) |
(1749, 1024) |
(4096,) |
(1749,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
30 |
nncf_module.bert.encoder.layer.5.attention.self.query |
10 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
31 |
nncf_module.bert.encoder.layer.5.attention.output.dense |
10 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
32 |
nncf_module.bert.encoder.layer.5.attention.self.value |
10 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
33 |
nncf_module.bert.encoder.layer.5.attention.self.key |
10 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
34 |
nncf_module.bert.encoder.layer.5.output.dense |
11 |
(1024, 4096) |
(1024, 2107) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
35 |
nncf_module.bert.encoder.layer.5.intermediate.dense |
11 |
(4096, 1024) |
(2107, 1024) |
(4096,) |
(2107,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
36 |
nncf_module.bert.encoder.layer.6.attention.self.query |
12 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
37 |
nncf_module.bert.encoder.layer.6.attention.self.key |
12 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
38 |
nncf_module.bert.encoder.layer.6.attention.self.value |
12 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
39 |
nncf_module.bert.encoder.layer.6.attention.output.dense |
12 |
(1024, 1024) |
(1024, 1024) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
40 |
nncf_module.bert.encoder.layer.6.output.dense |
13 |
(1024, 4096) |
(1024, 2368) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
41 |
nncf_module.bert.encoder.layer.6.intermediate.dense |
13 |
(4096, 1024) |
(2368, 1024) |
(4096,) |
(2368,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
42 |
nncf_module.bert.encoder.layer.7.attention.self.query |
14 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
43 |
nncf_module.bert.encoder.layer.7.attention.self.key |
14 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
44 |
nncf_module.bert.encoder.layer.7.attention.output.dense |
14 |
(1024, 1024) |
(1024, 128) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
45 |
nncf_module.bert.encoder.layer.7.attention.self.value |
14 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
46 |
nncf_module.bert.encoder.layer.7.intermediate.dense |
15 |
(4096, 1024) |
(2395, 1024) |
(4096,) |
(2395,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
47 |
nncf_module.bert.encoder.layer.7.output.dense |
15 |
(1024, 4096) |
(1024, 2395) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
48 |
nncf_module.bert.encoder.layer.8.attention.self.value |
16 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
49 |
nncf_module.bert.encoder.layer.8.attention.output.dense |
16 |
(1024, 1024) |
(1024, 128) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
50 |
nncf_module.bert.encoder.layer.8.attention.self.query |
16 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
51 |
nncf_module.bert.encoder.layer.8.attention.self.key |
16 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[1, 6] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
52 |
nncf_module.bert.encoder.layer.8.intermediate.dense |
17 |
(4096, 1024) |
(2352, 1024) |
(4096,) |
(2352,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
53 |
nncf_module.bert.encoder.layer.8.output.dense |
17 |
(1024, 4096) |
(1024, 2352) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
54 |
nncf_module.bert.encoder.layer.9.attention.self.query |
18 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
55 |
nncf_module.bert.encoder.layer.9.attention.self.key |
18 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
56 |
nncf_module.bert.encoder.layer.9.attention.output.dense |
18 |
(1024, 1024) |
(1024, 64) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
57 |
nncf_module.bert.encoder.layer.9.attention.self.value |
18 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
58 |
nncf_module.bert.encoder.layer.9.output.dense |
19 |
(1024, 4096) |
(1024, 2345) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
59 |
nncf_module.bert.encoder.layer.9.intermediate.dense |
19 |
(4096, 1024) |
(2345, 1024) |
(4096,) |
(2345,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
60 |
nncf_module.bert.encoder.layer.10.attention.self.query |
20 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[0] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
61 |
nncf_module.bert.encoder.layer.10.attention.self.key |
20 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[0] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
62 |
nncf_module.bert.encoder.layer.10.attention.output.dense |
20 |
(1024, 1024) |
(1024, 64) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[0] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
63 |
nncf_module.bert.encoder.layer.10.attention.self.value |
20 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[0] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
64 |
nncf_module.bert.encoder.layer.10.intermediate.dense |
21 |
(4096, 1024) |
(2261, 1024) |
(4096,) |
(2261,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
65 |
nncf_module.bert.encoder.layer.10.output.dense |
21 |
(1024, 4096) |
(1024, 2261) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
66 |
nncf_module.bert.encoder.layer.11.attention.output.dense |
22 |
(1024, 1024) |
(1024, 256) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[1, 4, 9, 13] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
67 |
nncf_module.bert.encoder.layer.11.attention.self.key |
22 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[1, 4, 9, 13] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
68 |
nncf_module.bert.encoder.layer.11.attention.self.value |
22 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[1, 4, 9, 13] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
69 |
nncf_module.bert.encoder.layer.11.attention.self.query |
22 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[1, 4, 9, 13] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
70 |
nncf_module.bert.encoder.layer.11.intermediate.dense |
23 |
(4096, 1024) |
(1950, 1024) |
(4096,) |
(1950,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
71 |
nncf_module.bert.encoder.layer.11.output.dense |
23 |
(1024, 4096) |
(1024, 1950) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
72 |
nncf_module.bert.encoder.layer.12.attention.self.query |
24 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[4, 5, 7, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
73 |
nncf_module.bert.encoder.layer.12.attention.self.value |
24 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[4, 5, 7, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
74 |
nncf_module.bert.encoder.layer.12.attention.self.key |
24 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[4, 5, 7, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
75 |
nncf_module.bert.encoder.layer.12.attention.output.dense |
24 |
(1024, 1024) |
(1024, 320) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[4, 5, 7, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
76 |
nncf_module.bert.encoder.layer.12.intermediate.dense |
25 |
(4096, 1024) |
(1818, 1024) |
(4096,) |
(1818,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
77 |
nncf_module.bert.encoder.layer.12.output.dense |
25 |
(1024, 4096) |
(1024, 1818) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[12]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
78 |
nncf_module.bert.encoder.layer.13.attention.self.query |
26 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[4, 7, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
79 |
nncf_module.bert.encoder.layer.13.attention.output.dense |
26 |
(1024, 1024) |
(1024, 256) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[4, 7, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
80 |
nncf_module.bert.encoder.layer.13.attention.self.key |
26 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[4, 7, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
81 |
nncf_module.bert.encoder.layer.13.attention.self.value |
26 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[4, 7, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
82 |
nncf_module.bert.encoder.layer.13.output.dense |
27 |
(1024, 4096) |
(1024, 1585) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
83 |
nncf_module.bert.encoder.layer.13.intermediate.dense |
27 |
(4096, 1024) |
(1585, 1024) |
(4096,) |
(1585,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[13]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
84 |
nncf_module.bert.encoder.layer.14.attention.output.dense |
28 |
(1024, 1024) |
(1024, 320) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[2, 3, 4, 7, 8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
85 |
nncf_module.bert.encoder.layer.14.attention.self.value |
28 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 3, 4, 7, 8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
86 |
nncf_module.bert.encoder.layer.14.attention.self.key |
28 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 3, 4, 7, 8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
87 |
nncf_module.bert.encoder.layer.14.attention.self.query |
28 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 3, 4, 7, 8] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
88 |
nncf_module.bert.encoder.layer.14.intermediate.dense |
29 |
(4096, 1024) |
(1165, 1024) |
(4096,) |
(1165,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
89 |
nncf_module.bert.encoder.layer.14.output.dense |
29 |
(1024, 4096) |
(1024, 1165) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[14]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
90 |
nncf_module.bert.encoder.layer.15.attention.output.dense |
30 |
(1024, 1024) |
(1024, 320) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[2, 7, 8, 10, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
91 |
nncf_module.bert.encoder.layer.15.attention.self.query |
30 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 7, 8, 10, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
92 |
nncf_module.bert.encoder.layer.15.attention.self.key |
30 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 7, 8, 10, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
93 |
nncf_module.bert.encoder.layer.15.attention.self.value |
30 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[2, 7, 8, 10, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
94 |
nncf_module.bert.encoder.layer.15.output.dense |
31 |
(1024, 4096) |
(1024, 982) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
95 |
nncf_module.bert.encoder.layer.15.intermediate.dense |
31 |
(4096, 1024) |
(982, 1024) |
(4096,) |
(982,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[15]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
96 |
nncf_module.bert.encoder.layer.16.attention.self.value |
32 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[0, 8, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
97 |
nncf_module.bert.encoder.layer.16.attention.self.key |
32 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[0, 8, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
98 |
nncf_module.bert.encoder.layer.16.attention.self.query |
32 |
(1024, 1024) |
(320, 1024) |
(1024,) |
(320,) |
group of 64 rows |
See pkl |
[0, 8, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
99 |
nncf_module.bert.encoder.layer.16.attention.output.dense |
32 |
(1024, 1024) |
(1024, 320) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[0, 8, 10, 13, 14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
100 |
nncf_module.bert.encoder.layer.16.intermediate.dense |
33 |
(4096, 1024) |
(941, 1024) |
(4096,) |
(941,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
101 |
nncf_module.bert.encoder.layer.16.output.dense |
33 |
(1024, 4096) |
(1024, 941) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[16]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
102 |
nncf_module.bert.encoder.layer.17.attention.self.key |
34 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[3, 6, 7, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
103 |
nncf_module.bert.encoder.layer.17.attention.self.value |
34 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[3, 6, 7, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
104 |
nncf_module.bert.encoder.layer.17.attention.output.dense |
34 |
(1024, 1024) |
(1024, 256) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[3, 6, 7, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
105 |
nncf_module.bert.encoder.layer.17.attention.self.query |
34 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[3, 6, 7, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
106 |
nncf_module.bert.encoder.layer.17.intermediate.dense |
35 |
(4096, 1024) |
(838, 1024) |
(4096,) |
(838,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
107 |
nncf_module.bert.encoder.layer.17.output.dense |
35 |
(1024, 4096) |
(1024, 838) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[17]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
108 |
nncf_module.bert.encoder.layer.18.attention.output.dense |
36 |
(1024, 1024) |
(1024, 192) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[6, 8, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
109 |
nncf_module.bert.encoder.layer.18.attention.self.value |
36 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[6, 8, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
110 |
nncf_module.bert.encoder.layer.18.attention.self.query |
36 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[6, 8, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
111 |
nncf_module.bert.encoder.layer.18.attention.self.key |
36 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[6, 8, 12] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
112 |
nncf_module.bert.encoder.layer.18.output.dense |
37 |
(1024, 4096) |
(1024, 611) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
113 |
nncf_module.bert.encoder.layer.18.intermediate.dense |
37 |
(4096, 1024) |
(611, 1024) |
(4096,) |
(611,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[18]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
114 |
nncf_module.bert.encoder.layer.19.attention.output.dense |
38 |
(1024, 1024) |
(1024, 192) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[7, 9, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
115 |
nncf_module.bert.encoder.layer.19.attention.self.key |
38 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[7, 9, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
116 |
nncf_module.bert.encoder.layer.19.attention.self.query |
38 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[7, 9, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
117 |
nncf_module.bert.encoder.layer.19.attention.self.value |
38 |
(1024, 1024) |
(192, 1024) |
(1024,) |
(192,) |
group of 64 rows |
See pkl |
[7, 9, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
118 |
nncf_module.bert.encoder.layer.19.intermediate.dense |
39 |
(4096, 1024) |
(371, 1024) |
(4096,) |
(371,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
119 |
nncf_module.bert.encoder.layer.19.output.dense |
39 |
(1024, 4096) |
(1024, 371) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[19]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
120 |
nncf_module.bert.encoder.layer.20.attention.self.key |
40 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[5, 6, 9, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
121 |
nncf_module.bert.encoder.layer.20.attention.self.value |
40 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[5, 6, 9, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
122 |
nncf_module.bert.encoder.layer.20.attention.output.dense |
40 |
(1024, 1024) |
(1024, 256) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[5, 6, 9, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
123 |
nncf_module.bert.encoder.layer.20.attention.self.query |
40 |
(1024, 1024) |
(256, 1024) |
(1024,) |
(256,) |
group of 64 rows |
See pkl |
[5, 6, 9, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
124 |
nncf_module.bert.encoder.layer.20.intermediate.dense |
41 |
(4096, 1024) |
(175, 1024) |
(4096,) |
(175,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
125 |
nncf_module.bert.encoder.layer.20.output.dense |
41 |
(1024, 4096) |
(1024, 175) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[20]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
126 |
nncf_module.bert.encoder.layer.21.attention.self.value |
42 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[6, 7] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
127 |
nncf_module.bert.encoder.layer.21.attention.output.dense |
42 |
(1024, 1024) |
(1024, 128) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[6, 7] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
128 |
nncf_module.bert.encoder.layer.21.attention.self.key |
42 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[6, 7] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
129 |
nncf_module.bert.encoder.layer.21.attention.self.query |
42 |
(1024, 1024) |
(128, 1024) |
(1024,) |
(128,) |
group of 64 rows |
See pkl |
[6, 7] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
130 |
nncf_module.bert.encoder.layer.21.output.dense |
43 |
(1024, 4096) |
(1024, 128) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
131 |
nncf_module.bert.encoder.layer.21.intermediate.dense |
43 |
(4096, 1024) |
(128, 1024) |
(4096,) |
(128,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[21]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
132 |
nncf_module.bert.encoder.layer.22.attention.self.value |
44 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
133 |
nncf_module.bert.encoder.layer.22.attention.self.query |
44 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
134 |
nncf_module.bert.encoder.layer.22.attention.output.dense |
44 |
(1024, 1024) |
(1024, 64) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
135 |
nncf_module.bert.encoder.layer.22.attention.self.key |
44 |
(1024, 1024) |
(64, 1024) |
(1024,) |
(64,) |
group of 64 rows |
See pkl |
[14] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
136 |
nncf_module.bert.encoder.layer.22.intermediate.dense |
45 |
(4096, 1024) |
(100, 1024) |
(4096,) |
(100,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
137 |
nncf_module.bert.encoder.layer.22.output.dense |
45 |
(1024, 4096) |
(1024, 100) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[22]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
138 |
nncf_module.bert.encoder.layer.23.attention.output.dense |
46 |
(1024, 1024) |
(1024, 704) |
(1024,) |
(1024,) |
group of 64 cols |
See pkl |
[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
139 |
nncf_module.bert.encoder.layer.23.attention.self.key |
46 |
(1024, 1024) |
(704, 1024) |
(1024,) |
(704,) |
group of 64 rows |
See pkl |
[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
140 |
nncf_module.bert.encoder.layer.23.attention.self.value |
46 |
(1024, 1024) |
(704, 1024) |
(1024,) |
(704,) |
group of 64 rows |
See pkl |
[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
141 |
nncf_module.bert.encoder.layer.23.attention.self.query |
46 |
(1024, 1024) |
(704, 1024) |
(1024,) |
(704,) |
group of 64 rows |
See pkl |
[0, 1, 3, 5, 7, 8, 10, 11, 13, 14, 15] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
142 |
nncf_module.bert.encoder.layer.23.output.dense |
47 |
(1024, 4096) |
(1024, 114) |
(1024,) |
(1024,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
143 |
nncf_module.bert.encoder.layer.23.intermediate.dense |
47 |
(4096, 1024) |
(114, 1024) |
(4096,) |
(114,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[23]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |