0 |
nncf_module.bert.encoder.layer.0.attention.output.dense |
0 |
(768, 768) |
(768, 192) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[3, 8, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
1 |
nncf_module.bert.encoder.layer.0.attention.self.query |
0 |
(768, 768) |
(192, 768) |
(768,) |
(192,) |
group of 64 rows |
See pkl |
[3, 8, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
2 |
nncf_module.bert.encoder.layer.0.attention.self.value |
0 |
(768, 768) |
(192, 768) |
(768,) |
(192,) |
group of 64 rows |
See pkl |
[3, 8, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
3 |
nncf_module.bert.encoder.layer.0.attention.self.key |
0 |
(768, 768) |
(192, 768) |
(768,) |
(192,) |
group of 64 rows |
See pkl |
[3, 8, 10] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
4 |
nncf_module.bert.encoder.layer.0.intermediate.dense |
1 |
(3072, 768) |
(2094, 768) |
(3072,) |
(2094,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
5 |
nncf_module.bert.encoder.layer.0.output.dense |
1 |
(768, 3072) |
(768, 2094) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[0]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
6 |
nncf_module.bert.encoder.layer.1.attention.self.key |
2 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[1, 4, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
7 |
nncf_module.bert.encoder.layer.1.attention.self.value |
2 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[1, 4, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
8 |
nncf_module.bert.encoder.layer.1.attention.output.dense |
2 |
(768, 768) |
(768, 320) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[1, 4, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
9 |
nncf_module.bert.encoder.layer.1.attention.self.query |
2 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[1, 4, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
10 |
nncf_module.bert.encoder.layer.1.output.dense |
3 |
(768, 3072) |
(768, 2062) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
11 |
nncf_module.bert.encoder.layer.1.intermediate.dense |
3 |
(3072, 768) |
(2062, 768) |
(3072,) |
(2062,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[1]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
12 |
nncf_module.bert.encoder.layer.2.attention.self.key |
4 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
13 |
nncf_module.bert.encoder.layer.2.attention.output.dense |
4 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
14 |
nncf_module.bert.encoder.layer.2.attention.self.value |
4 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
15 |
nncf_module.bert.encoder.layer.2.attention.self.query |
4 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
16 |
nncf_module.bert.encoder.layer.2.output.dense |
5 |
(768, 3072) |
(768, 2229) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
17 |
nncf_module.bert.encoder.layer.2.intermediate.dense |
5 |
(3072, 768) |
(2229, 768) |
(3072,) |
(2229,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[2]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
18 |
nncf_module.bert.encoder.layer.3.attention.self.query |
6 |
(768, 768) |
(448, 768) |
(768,) |
(448,) |
group of 64 rows |
See pkl |
[0, 1, 5, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
19 |
nncf_module.bert.encoder.layer.3.attention.output.dense |
6 |
(768, 768) |
(768, 448) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 5, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
20 |
nncf_module.bert.encoder.layer.3.attention.self.value |
6 |
(768, 768) |
(448, 768) |
(768,) |
(448,) |
group of 64 rows |
See pkl |
[0, 1, 5, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
21 |
nncf_module.bert.encoder.layer.3.attention.self.key |
6 |
(768, 768) |
(448, 768) |
(768,) |
(448,) |
group of 64 rows |
See pkl |
[0, 1, 5, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
22 |
nncf_module.bert.encoder.layer.3.intermediate.dense |
7 |
(3072, 768) |
(2155, 768) |
(3072,) |
(2155,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
23 |
nncf_module.bert.encoder.layer.3.output.dense |
7 |
(768, 3072) |
(768, 2155) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[3]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
24 |
nncf_module.bert.encoder.layer.4.attention.output.dense |
8 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
25 |
nncf_module.bert.encoder.layer.4.attention.self.query |
8 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
26 |
nncf_module.bert.encoder.layer.4.attention.self.key |
8 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
27 |
nncf_module.bert.encoder.layer.4.attention.self.value |
8 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
28 |
nncf_module.bert.encoder.layer.4.output.dense |
9 |
(768, 3072) |
(768, 1973) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
29 |
nncf_module.bert.encoder.layer.4.intermediate.dense |
9 |
(3072, 768) |
(1973, 768) |
(3072,) |
(1973,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[4]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
30 |
nncf_module.bert.encoder.layer.5.attention.self.key |
10 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
31 |
nncf_module.bert.encoder.layer.5.attention.output.dense |
10 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
32 |
nncf_module.bert.encoder.layer.5.attention.self.value |
10 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
33 |
nncf_module.bert.encoder.layer.5.attention.self.query |
10 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
34 |
nncf_module.bert.encoder.layer.5.intermediate.dense |
11 |
(3072, 768) |
(1947, 768) |
(3072,) |
(1947,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
35 |
nncf_module.bert.encoder.layer.5.output.dense |
11 |
(768, 3072) |
(768, 1947) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[5]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
36 |
nncf_module.bert.encoder.layer.6.attention.self.value |
12 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
37 |
nncf_module.bert.encoder.layer.6.attention.output.dense |
12 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
38 |
nncf_module.bert.encoder.layer.6.attention.self.query |
12 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
39 |
nncf_module.bert.encoder.layer.6.attention.self.key |
12 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
40 |
nncf_module.bert.encoder.layer.6.output.dense |
13 |
(768, 3072) |
(768, 1539) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
41 |
nncf_module.bert.encoder.layer.6.intermediate.dense |
13 |
(3072, 768) |
(1539, 768) |
(3072,) |
(1539,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[6]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
42 |
nncf_module.bert.encoder.layer.7.attention.self.value |
14 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
43 |
nncf_module.bert.encoder.layer.7.attention.self.key |
14 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
44 |
nncf_module.bert.encoder.layer.7.attention.self.query |
14 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 rows |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
45 |
nncf_module.bert.encoder.layer.7.attention.output.dense |
14 |
(768, 768) |
(768, 768) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
46 |
nncf_module.bert.encoder.layer.7.output.dense |
15 |
(768, 3072) |
(768, 1151) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
47 |
nncf_module.bert.encoder.layer.7.intermediate.dense |
15 |
(3072, 768) |
(1151, 768) |
(3072,) |
(1151,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[7]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
48 |
nncf_module.bert.encoder.layer.8.attention.output.dense |
16 |
(768, 768) |
(768, 384) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[1, 2, 6, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
49 |
nncf_module.bert.encoder.layer.8.attention.self.value |
16 |
(768, 768) |
(384, 768) |
(768,) |
(384,) |
group of 64 rows |
See pkl |
[1, 2, 6, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
50 |
nncf_module.bert.encoder.layer.8.attention.self.query |
16 |
(768, 768) |
(384, 768) |
(768,) |
(384,) |
group of 64 rows |
See pkl |
[1, 2, 6, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
51 |
nncf_module.bert.encoder.layer.8.attention.self.key |
16 |
(768, 768) |
(384, 768) |
(768,) |
(384,) |
group of 64 rows |
See pkl |
[1, 2, 6, 9, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
52 |
nncf_module.bert.encoder.layer.8.output.dense |
17 |
(768, 3072) |
(768, 714) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
53 |
nncf_module.bert.encoder.layer.8.intermediate.dense |
17 |
(3072, 768) |
(714, 768) |
(3072,) |
(714,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[8]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
54 |
nncf_module.bert.encoder.layer.9.attention.self.value |
18 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[0, 2, 6, 8, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
55 |
nncf_module.bert.encoder.layer.9.attention.self.query |
18 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[0, 2, 6, 8, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
56 |
nncf_module.bert.encoder.layer.9.attention.self.key |
18 |
(768, 768) |
(320, 768) |
(768,) |
(320,) |
group of 64 rows |
See pkl |
[0, 2, 6, 8, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
57 |
nncf_module.bert.encoder.layer.9.attention.output.dense |
18 |
(768, 768) |
(768, 320) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[0, 2, 6, 8, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
58 |
nncf_module.bert.encoder.layer.9.output.dense |
19 |
(768, 3072) |
(768, 266) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
59 |
nncf_module.bert.encoder.layer.9.intermediate.dense |
19 |
(3072, 768) |
(266, 768) |
(3072,) |
(266,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[9]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
60 |
nncf_module.bert.encoder.layer.10.attention.self.query |
20 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[3, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
61 |
nncf_module.bert.encoder.layer.10.attention.self.value |
20 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[3, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
62 |
nncf_module.bert.encoder.layer.10.attention.output.dense |
20 |
(768, 768) |
(768, 256) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[3, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
63 |
nncf_module.bert.encoder.layer.10.attention.self.key |
20 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[3, 7, 10, 11] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
64 |
nncf_module.bert.encoder.layer.10.output.dense |
21 |
(768, 3072) |
(768, 297) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertOutput[output]/NNCFLinear[dense]/linear_0 |
65 |
nncf_module.bert.encoder.layer.10.intermediate.dense |
21 |
(3072, 768) |
(297, 768) |
(3072,) |
(297,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[10]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
66 |
nncf_module.bert.encoder.layer.11.attention.output.dense |
22 |
(768, 768) |
(768, 256) |
(768,) |
(768,) |
group of 64 cols |
See pkl |
[1, 2, 3, 4] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfOutput[output]/NNCFLinear[dense]/linear_0 |
67 |
nncf_module.bert.encoder.layer.11.attention.self.value |
22 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[1, 2, 3, 4] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[value]/linear_0 |
68 |
nncf_module.bert.encoder.layer.11.attention.self.key |
22 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[1, 2, 3, 4] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[key]/linear_0 |
69 |
nncf_module.bert.encoder.layer.11.attention.self.query |
22 |
(768, 768) |
(256, 768) |
(768,) |
(256,) |
group of 64 rows |
See pkl |
[1, 2, 3, 4] |
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertAttention[attention]/BertSelfAttention[self]/NNCFLinear[query]/linear_0 |
70 |
nncf_module.bert.encoder.layer.11.intermediate.dense |
23 |
(3072, 768) |
(322, 768) |
(3072,) |
(322,) |
row |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertIntermediate[intermediate]/NNCFLinear[dense]/linear_0 |
71 |
nncf_module.bert.encoder.layer.11.output.dense |
23 |
(768, 3072) |
(768, 322) |
(768,) |
(768,) |
col |
See pkl |
|
BertForQuestionAnswering/BertModel[bert]/BertEncoder[encoder]/ModuleList[layer]/BertLayer[11]/BertOutput[output]/NNCFLinear[dense]/linear_0 |