bert-base-squadv1-block-pruning-hybrid-filled-lt-nncf-50.0sparse-qat-lt
/
XP_linear_layer_sparsity_20M_params_50.00_sparsity.csv
,layer_id,layer_type,param_type,shape,nparam,nnz,sparsity | |
5,nncf_module.bert.encoder.layer.0.attention.self.query,NNCFLinear,weight,"[320, 768]",245760,106337,0.5673136115074158 | |
7,nncf_module.bert.encoder.layer.0.attention.self.key,NNCFLinear,weight,"[320, 768]",245760,112375,0.5427449345588684 | |
9,nncf_module.bert.encoder.layer.0.attention.self.value,NNCFLinear,weight,"[320, 768]",245760,131965,0.4630330204963684 | |
11,nncf_module.bert.encoder.layer.0.attention.output.dense,NNCFLinear,weight,"[768, 320]",245760,137497,0.44052326679229736 | |
15,nncf_module.bert.encoder.layer.0.intermediate.dense,NNCFLinear,weight,"[185, 768]",142080,110056,0.2253941297531128 | |
17,nncf_module.bert.encoder.layer.0.output.dense,NNCFLinear,weight,"[768, 185]",142080,108631,0.23542368412017822 | |
21,nncf_module.bert.encoder.layer.1.attention.self.query,NNCFLinear,weight,"[320, 768]",245760,136222,0.44571125507354736 | |
23,nncf_module.bert.encoder.layer.1.attention.self.key,NNCFLinear,weight,"[320, 768]",245760,136267,0.44552814960479736 | |
25,nncf_module.bert.encoder.layer.1.attention.self.value,NNCFLinear,weight,"[320, 768]",245760,124892,0.49181312322616577 | |
27,nncf_module.bert.encoder.layer.1.attention.output.dense,NNCFLinear,weight,"[768, 320]",245760,130185,0.47027587890625 | |
31,nncf_module.bert.encoder.layer.1.intermediate.dense,NNCFLinear,weight,"[315, 768]",241920,176203,0.2716476321220398 | |
33,nncf_module.bert.encoder.layer.1.output.dense,NNCFLinear,weight,"[768, 315]",241920,172407,0.2873387932777405 | |
37,nncf_module.bert.encoder.layer.2.attention.self.query,NNCFLinear,weight,"[576, 768]",442368,198811,0.5505754947662354 | |
39,nncf_module.bert.encoder.layer.2.attention.self.key,NNCFLinear,weight,"[576, 768]",442368,201526,0.5444381237030029 | |
41,nncf_module.bert.encoder.layer.2.attention.self.value,NNCFLinear,weight,"[576, 768]",442368,163541,0.6303055286407471 | |
43,nncf_module.bert.encoder.layer.2.attention.output.dense,NNCFLinear,weight,"[768, 576]",442368,167245,0.6219323873519897 | |
47,nncf_module.bert.encoder.layer.2.intermediate.dense,NNCFLinear,weight,"[339, 768]",260352,185491,0.2875376343727112 | |
49,nncf_module.bert.encoder.layer.2.output.dense,NNCFLinear,weight,"[768, 339]",260352,183083,0.2967866063117981 | |
53,nncf_module.bert.encoder.layer.3.attention.self.query,NNCFLinear,weight,"[576, 768]",442368,205898,0.5345549583435059 | |
55,nncf_module.bert.encoder.layer.3.attention.self.key,NNCFLinear,weight,"[576, 768]",442368,217621,0.5080543756484985 | |
57,nncf_module.bert.encoder.layer.3.attention.self.value,NNCFLinear,weight,"[576, 768]",442368,209726,0.5259014964103699 | |
59,nncf_module.bert.encoder.layer.3.attention.output.dense,NNCFLinear,weight,"[768, 576]",442368,208038,0.5297173261642456 | |
63,nncf_module.bert.encoder.layer.3.intermediate.dense,NNCFLinear,weight,"[368, 768]",282624,198154,0.29887765645980835 | |
65,nncf_module.bert.encoder.layer.3.output.dense,NNCFLinear,weight,"[768, 368]",282624,194127,0.31312626600265503 | |
69,nncf_module.bert.encoder.layer.4.attention.self.query,NNCFLinear,weight,"[576, 768]",442368,212567,0.5194792747497559 | |
71,nncf_module.bert.encoder.layer.4.attention.self.key,NNCFLinear,weight,"[576, 768]",442368,214788,0.5144585371017456 | |
73,nncf_module.bert.encoder.layer.4.attention.self.value,NNCFLinear,weight,"[576, 768]",442368,197159,0.5543099641799927 | |
75,nncf_module.bert.encoder.layer.4.attention.output.dense,NNCFLinear,weight,"[768, 576]",442368,192495,0.5648532509803772 | |
79,nncf_module.bert.encoder.layer.4.intermediate.dense,NNCFLinear,weight,"[386, 768]",296448,205830,0.3056792616844177 | |
81,nncf_module.bert.encoder.layer.4.output.dense,NNCFLinear,weight,"[768, 386]",296448,199567,0.32680606842041016 | |
85,nncf_module.bert.encoder.layer.5.attention.self.query,NNCFLinear,weight,"[384, 768]",294912,131257,0.5549282431602478 | |
87,nncf_module.bert.encoder.layer.5.attention.self.key,NNCFLinear,weight,"[384, 768]",294912,154458,0.47625732421875 | |
89,nncf_module.bert.encoder.layer.5.attention.self.value,NNCFLinear,weight,"[384, 768]",294912,159646,0.4586656093597412 | |
91,nncf_module.bert.encoder.layer.5.attention.output.dense,NNCFLinear,weight,"[768, 384]",294912,156889,0.4680141806602478 | |
95,nncf_module.bert.encoder.layer.5.intermediate.dense,NNCFLinear,weight,"[336, 768]",258048,184774,0.2839548587799072 | |
97,nncf_module.bert.encoder.layer.5.output.dense,NNCFLinear,weight,"[768, 336]",258048,178574,0.3079814314842224 | |
101,nncf_module.bert.encoder.layer.6.attention.self.query,NNCFLinear,weight,"[448, 768]",344064,153126,0.5549490451812744 | |
103,nncf_module.bert.encoder.layer.6.attention.self.key,NNCFLinear,weight,"[448, 768]",344064,169706,0.5067603588104248 | |
105,nncf_module.bert.encoder.layer.6.attention.self.value,NNCFLinear,weight,"[448, 768]",344064,154213,0.5517897605895996 | |
107,nncf_module.bert.encoder.layer.6.attention.output.dense,NNCFLinear,weight,"[768, 448]",344064,148815,0.5674787163734436 | |
111,nncf_module.bert.encoder.layer.6.intermediate.dense,NNCFLinear,weight,"[280, 768]",215040,158800,0.261532723903656 | |
113,nncf_module.bert.encoder.layer.6.output.dense,NNCFLinear,weight,"[768, 280]",215040,156397,0.27270740270614624 | |
117,nncf_module.bert.encoder.layer.7.attention.self.query,NNCFLinear,weight,"[448, 768]",344064,153876,0.5527692437171936 | |
119,nncf_module.bert.encoder.layer.7.attention.self.key,NNCFLinear,weight,"[448, 768]",344064,180384,0.4757254123687744 | |
121,nncf_module.bert.encoder.layer.7.attention.self.value,NNCFLinear,weight,"[448, 768]",344064,166552,0.515927255153656 | |
123,nncf_module.bert.encoder.layer.7.attention.output.dense,NNCFLinear,weight,"[768, 448]",344064,160346,0.5339646339416504 | |
127,nncf_module.bert.encoder.layer.7.intermediate.dense,NNCFLinear,weight,"[211, 768]",162048,125197,0.22740793228149414 | |
129,nncf_module.bert.encoder.layer.7.output.dense,NNCFLinear,weight,"[768, 211]",162048,123451,0.23818248510360718 | |
133,nncf_module.bert.encoder.layer.8.attention.self.query,NNCFLinear,weight,"[448, 768]",344064,149419,0.5657232403755188 | |
135,nncf_module.bert.encoder.layer.8.attention.self.key,NNCFLinear,weight,"[448, 768]",344064,150699,0.5620030164718628 | |
137,nncf_module.bert.encoder.layer.8.attention.self.value,NNCFLinear,weight,"[448, 768]",344064,124770,0.6373639702796936 | |
139,nncf_module.bert.encoder.layer.8.attention.output.dense,NNCFLinear,weight,"[768, 448]",344064,120648,0.6493443250656128 | |
143,nncf_module.bert.encoder.layer.8.intermediate.dense,NNCFLinear,weight,"[108, 768]",82944,68989,0.16824603080749512 | |
145,nncf_module.bert.encoder.layer.8.output.dense,NNCFLinear,weight,"[768, 108]",82944,68556,0.17346644401550293 | |
149,nncf_module.bert.encoder.layer.9.attention.self.query,NNCFLinear,weight,"[320, 768]",245760,121225,0.5067341923713684 | |
151,nncf_module.bert.encoder.layer.9.attention.self.key,NNCFLinear,weight,"[320, 768]",245760,114789,0.5329223275184631 | |
153,nncf_module.bert.encoder.layer.9.attention.self.value,NNCFLinear,weight,"[320, 768]",245760,69260,0.7181802988052368 | |
155,nncf_module.bert.encoder.layer.9.attention.output.dense,NNCFLinear,weight,"[768, 320]",245760,73575,0.70062255859375 | |
159,nncf_module.bert.encoder.layer.9.intermediate.dense,NNCFLinear,weight,"[53, 768]",40704,35399,0.13033121824264526 | |
161,nncf_module.bert.encoder.layer.9.output.dense,NNCFLinear,weight,"[768, 53]",40704,34918,0.1421481966972351 | |
165,nncf_module.bert.encoder.layer.10.attention.self.query,NNCFLinear,weight,"[384, 768]",294912,128113,0.5655890703201294 | |
167,nncf_module.bert.encoder.layer.10.attention.self.key,NNCFLinear,weight,"[384, 768]",294912,124553,0.5776604413986206 | |
169,nncf_module.bert.encoder.layer.10.attention.self.value,NNCFLinear,weight,"[384, 768]",294912,79608,0.7300618886947632 | |
171,nncf_module.bert.encoder.layer.10.attention.output.dense,NNCFLinear,weight,"[768, 384]",294912,85158,0.71124267578125 | |
175,nncf_module.bert.encoder.layer.10.intermediate.dense,NNCFLinear,weight,"[86, 768]",66048,55025,0.16689378023147583 | |
177,nncf_module.bert.encoder.layer.10.output.dense,NNCFLinear,weight,"[768, 86]",66048,54584,0.17357075214385986 | |
181,nncf_module.bert.encoder.layer.11.attention.self.query,NNCFLinear,weight,"[384, 768]",294912,104737,0.6448533535003662 | |
183,nncf_module.bert.encoder.layer.11.attention.self.key,NNCFLinear,weight,"[384, 768]",294912,102558,0.6522420644760132 | |
185,nncf_module.bert.encoder.layer.11.attention.self.value,NNCFLinear,weight,"[384, 768]",294912,64855,0.7800869345664978 | |
187,nncf_module.bert.encoder.layer.11.attention.output.dense,NNCFLinear,weight,"[768, 384]",294912,69674,0.7637465000152588 | |
191,nncf_module.bert.encoder.layer.11.intermediate.dense,NNCFLinear,weight,"[105, 768]",80640,67724,0.16016864776611328 | |
193,nncf_module.bert.encoder.layer.11.output.dense,NNCFLinear,weight,"[768, 105]",80640,67519,0.1627107858657837 | |