madlag committed on
Commit
4b2215f
1 Parent(s): e3e88c8

Adding model, graphs and metadata.

Browse files
README.md CHANGED
@@ -28,7 +28,7 @@ The model contains **32.0%** of the original weights **overall** (the embeddings
28
  With a simple resizing of the linear matrices it ran **2.15x as fast as bert-large-uncased-whole-word-masking** on the evaluation.
29
  This is possible because the pruning method led to structured matrices: to visualize them, hover over the plot below to see the non-zero/zero parts of each matrix.
30
 
31
- <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/density_info.js" id="a85caee3-4b94-4040-a1fc-e7d48dee0140"></script></div>
32
 
33
  In terms of accuracy, its **F1 is 83.22**, compared with 85.85 for bert-large-uncased-whole-word-masking, an **F1 drop of 2.63**.
34
 
@@ -38,7 +38,7 @@ This model is case-insensitive: it does not make a difference between english an
38
 
39
  A side-effect of the block pruning is that some of the attention heads are completely removed: 155 heads were removed out of a total of 384 (40.4%).
40
  Here is a detailed view of how the remaining heads are distributed in the network after pruning.
41
- <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/pruning_info.js" id="28643677-244b-48fb-940c-10f2831ab74e"></script></div>
42
 
43
  ## Details of the SQuAD1.1 dataset
44
 
28
  With a simple resizing of the linear matrices it ran **2.15x as fast as bert-large-uncased-whole-word-masking** on the evaluation.
29
  This is possible because the pruning method led to structured matrices: to visualize them, hover over the plot below to see the non-zero/zero parts of each matrix.
30
 
31
+ <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/density_info.js" id="1debdd41-fd37-4bdc-9680-8b9c19589d73"></script></div>
32
 
33
  In terms of accuracy, its **F1 is 83.22**, compared with 85.85 for bert-large-uncased-whole-word-masking, an **F1 drop of 2.63**.
34
 
38
 
39
  A side-effect of the block pruning is that some of the attention heads are completely removed: 155 heads were removed out of a total of 384 (40.4%).
40
  Here is a detailed view of how the remaining heads are distributed in the network after pruning.
41
+ <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/pruning_info.js" id="275e9fa1-bc94-4a73-a36c-e250fd7810ec"></script></div>
42
 
43
  ## Details of the SQuAD1.1 dataset
44
 
eval/nbest_predictions.json.tgz CHANGED
Binary files a/eval/nbest_predictions.json.tgz and b/eval/nbest_predictions.json.tgz differ
model_card/density_info.js CHANGED
@@ -16,9 +16,9 @@
16
 
17
 
18
 
19
- var element = document.getElementById("a85caee3-4b94-4040-a1fc-e7d48dee0140");
20
  if (element == null) {
21
- console.warn("Bokeh: autoload.js configured with elementid 'a85caee3-4b94-4040-a1fc-e7d48dee0140' but no matching script tag was found.")
22
  }
23
 
24
 
@@ -115,8 +115,8 @@
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
- var docs_json = '{"f56a7c28-6e1b-4927-93b9-4555a3be5feb":{"roots":{"references":[{"attributes":{},"id":"1098","type":"DataRange1d"},{"attributes":{"source":{"id":"1116"}},"id":"1121","type":"CDSView"},{"attributes":{"start":0},"id":"1100","type":"DataRange1d"},{"attributes":{"fill_color":{"value":"#ed5642"},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1124","type":"VBar"},{"attributes":{"data":{"density":["30.3%","37.9%","19.5%","28.4%","20.3%","16.8%","19.9%","35.0%","47.9%","36.4%","43.8%","53.8%","51.2%","50.8%","64.3%","64.9%","76.3%","58.7%","68.7%","60.3%","45.8%","17.2%","17.4%","15.8%"],"height":[0.31744,0.397312,0.2048,0.297984,0.212992,0.176128,0.208896,0.366592,0.50176,0.381952,0.458752,0.564224,0.536576,0.53248,0.673792,0.68096,0.799744,0.615424,0.719872,0.631808,0.480256,0.180224,0.182272,0.165888],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.key","1.attention.key","2.attention.key","3.attention.key","4.attention.key","5.attention.key","6.attention.key","7.attention.key","8.attention.key","9.attention.key","10.attention.key","11.attention.key","12.attention.key","13.attention.key","14.attention.key","15.attention.key","16.attention.key","17.attention.key","18.attention.key","19.attention.key","20.attention.key","21.attention.key","22.attention.key","23.attention.key"],"parameters":["0.32","0.40","0.20","0.30","0.21","0.18","0.21","0.37","0.50","0.38","0.46","0.56","0.54","0.53","0.67","0.68","0.80","0.62","0.72","0.63","0.48","0.18","0.18","0.17"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25
-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83
.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_key.png"],"x":[0.25,1.25,2.25,3.25,4.25,5.25,6.25,7.25,8.25,9.25,10.25,11.25,12.25,13.25,14.25,15.25,16.25,17.25,18.25,19.25,20.25,21.25,22.25,23.25]},"selected":{"id":"1152"},"selection_policy":{"id":"1153"}},"id":"1122","type":"ColumnDataSource"},{"attributes":{"axis_label":"Layer","formatter":{"id":"1149"},"minor_tick_line_color":null,"ticker":{"id":"1107"}},"id":"1106","type":"LinearAxis"},{"attributes":{},"id":"1153","type":"UnionRenderers"},{"attributes":{},"id":"1107","type":"BasicTicker"},{"attributes":{},"id":"1104","type":"LinearScale"},{"attributes":{"axis_label":"Parameters 
(M)","formatter":{"id":"1147"},"minor_tick_line_color":null,"ticker":{"id":"1111"}},"id":"1110","type":"LinearAxis"},{"attributes":{"data_source":{"id":"1122"},"glyph":{"id":"1124"},"hover_glyph":null,"muted_glyph":null,"name":"key","nonselection_glyph":{"id":"1125"},"selection_glyph":null,"view":{"id":"1127"}},"id":"1126","type":"GlyphRenderer"},{"attributes":{},"id":"1102","type":"LinearScale"},{"attributes":{"data_source":{"id":"1134"},"glyph":{"id":"1136"},"hover_glyph":null,"muted_glyph":null,"name":"fully connected","nonselection_glyph":{"id":"1137"},"selection_glyph":null,"view":{"id":"1139"}},"id":"1138","type":"GlyphRenderer"},{"attributes":{"axis":{"id":"1106"},"grid_line_color":null,"ticker":null},"id":"1109","type":"Grid"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#ed5642"},"line_alpha":{"value":0.1},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1125","type":"VBar"},{"attributes":{},"id":"1155","type":"UnionRenderers"},{"attributes":{"data":{"density":["31.8%","34.0%","16.4%","26.9%","18.8%","17.6%","19.4%","35.4%","37.8%","28.7%","37.6%","44.5%","44.5%","50.7%","54.0%","54.1%","68.5%","54.7%","57.3%","43.8%","27.6%","12.1%","13.0%","11.2%"],"height":[0.333824,0.356352,0.172032,0.2816,0.196608,0.18432,0.203776,0.371712,0.396288,0.301056,0.39424,0.466944,0.466944,0.531456,0.566272,0.567296,0.717824,0.57344,0.601088,0.458752,0.289792,0.126976,0.136192,0.11776],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.value","1.attention.value","2.attention.value","3.attention.value","4.attention.value","5
.attention.value","6.attention.value","7.attention.value","8.attention.value","9.attention.value","10.attention.value","11.attention.value","12.attention.value","13.attention.value","14.attention.value","15.attention.value","16.attention.value","17.attention.value","18.attention.value","19.attention.value","20.attention.value","21.attention.value","22.attention.value","23.attention.value"],"parameters":["0.33","0.36","0.17","0.28","0.20","0.18","0.20","0.37","0.40","0.30","0.39","0.47","0.47","0.53","0.57","0.57","0.72","0.57","0.60","0.46","0.29","0.13","0.14","0.12"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_value.png","/madlag/bert-large
-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_value.png"],"x":[0.41666666666666663,1.4166666666666665,2.416666666666667,3.416666666666667,4.416666666666666,5.416666666666666,6.416666666666666,7.416666666666666,8.416666666666668,9.416666666666668,10.416666666666668,11.416666666666668,12.416666666666668,13.416666666666668,14.416666666666668,15.416666666666668,16.416666666666664,17.416666666666664,18.41666666666
6664,19.416666666666664,20.416666666666664,21.416666666666664,22.416666666666664,23.416666666666664]},"selected":{"id":"1154"},"selection_policy":{"id":"1155"}},"id":"1128","type":"ColumnDataSource"},{"attributes":{"source":{"id":"1122"}},"id":"1127","type":"CDSView"},{"attributes":{},"id":"1154","type":"Selection"},{"attributes":{"axis":{"id":"1110"},"dimension":1,"ticker":null},"id":"1113","type":"Grid"},{"attributes":{},"id":"1111","type":"BasicTicker"},{"attributes":{"fill_color":{"value":"#20cb97"},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1130","type":"VBar"},{"attributes":{},"id":"1147","type":"BasicTickFormatter"},{"attributes":{"callback":null,"tooltips":"\\n &lt;div&gt;\\n &lt;div style=\\"margin-bottom:10px\\"&gt;\\n &lt;span style=\\"font-size: 15px;\\"&gt;&lt;b&gt;@name&lt;/b&gt;&lt;br/&gt;density=@density&lt;/span&gt;\\n &lt;/div&gt;\\n &lt;div&gt; \\n &lt;img\\n src=\\"@url\\" height=\\"@img_height\\" width=\\"@img_width\\" alt=\\"@url\\"\\n style=\\"float: left; margin: 0px 15px 15px 0px;\\"\\n border=\\"0\\"\\n /&gt;\\n &lt;/div&gt;\\n &lt;/div&gt;\\n "},"id":"1094","type":"HoverTool"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto","tools":[{"id":"1094"}]},"id":"1114","type":"Toolbar"},{"attributes":{"text":"Transformer 
Layers"},"id":"1096","type":"Title"},{"attributes":{"data_source":{"id":"1128"},"glyph":{"id":"1130"},"hover_glyph":null,"muted_glyph":null,"name":"value","nonselection_glyph":{"id":"1131"},"selection_glyph":null,"view":{"id":"1133"}},"id":"1132","type":"GlyphRenderer"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#20cb97"},"line_alpha":{"value":0.1},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1131","type":"VBar"},{"attributes":{},"id":"1157","type":"UnionRenderers"},{"attributes":{"source":{"id":"1128"}},"id":"1133","type":"CDSView"},{"attributes":{},"id":"1150","type":"Selection"},{"attributes":{"fill_color":{"value":"#6573f7"},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1118","type":"VBar"},{"attributes":{"data":{"density":["34.4%","15.4%","15.4%","35.9%","17.0%","17.0%","17.9%","21.2%","21.2%","30.7%","24.2%","24.2%","21.6%","24.3%","24.3%","18.7%","25.3%","25.3%","20.5%","27.6%","27.6%","38.3%","27.9%","27.9%","39.3%","27.8%","27.8%","31.0%","29.4%","29.4%","39.5%","23.7%","23.7%","48.8%","26.3%","26.3%","47.3%","23.7%","23.7%","51.8%","28.5%","28.5%","57.6%","23.1%","23.1%","56.9%","22.3%","22.3%","68.9%","23.7%","23.7%","56.2%","21.7%","21.7%","57.2%","15.0%","15.0%","41.1%","9.3%","9.3%","26.7%","6.1%","6.1%","10.6%","3.1%","3.1%","11.4%","1.8%","1.8%","9.6%","3.4%","3.4%"],"height":[0.360448,0.647168,0.647168,0.376832,0.714752,0.714752,0.187392,0.887808,0.887808,0.321536,1.01376,1.01376,0.226304,1.017856,1.017856,0.195584,1.061888,1.061888,0.21504,1.156096,1.156096,0.401408,1.169408,1.169408,0.411648,1.164288,1.164288,0.324608,1.231872,1.231872,0.413696,0.995328,0.995328,0.512,1.103872,1.103872,0.495616,0.994304,0.994304,0.54272,1.196032,1.196032,0.60416,0.970752,0.970752,0.596992,0.93696,0.93696,0.722944,0.992256,0.992256,0.5888,0.910336,0.910336,0.600064,0.62976,0.62976,0.431104,0.388096,0.388096,0.279552,0.2539
52,0.253952,0.111616,0.130048,0.130048,0.119808,0.074752,0.074752,0.100352,0.142336,0.142336],"img_height":["128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px"],"img_width":["128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px"],"name":["0.attention.output","0.intermediate","0.output","1.attention.output","1.intermediate","1.output","2.attention.output","2.intermediate","2.output","3.attention.output","3.intermediate","3.output","4.attention.output","4.intermediate","4.output","5.attention.output","5.intermediate","5.output","6.attention.output","6.intermediate","6.output","7.attention.output","7.intermediate","7.output","8.attention.output","8.intermediate","8.output","9.attention.output","9.intermediate","9.output","10.attention.output","10.intermediate","10.output","11.attention.output","11.intermediate","11.output","12.attention.output","12.intermediate","12.output","13.attention.output","13.intermediate","13.output","14.attention.outpu
t","14.intermediate","14.output","15.attention.output","15.intermediate","15.output","16.attention.output","16.intermediate","16.output","17.attention.output","17.intermediate","17.output","18.attention.output","18.intermediate","18.output","19.attention.output","19.intermediate","19.output","20.attention.output","20.intermediate","20.output","21.attention.output","21.intermediate","21.output","22.attention.output","22.intermediate","22.output","23.attention.output","23.intermediate","23.output"],"parameters":["0.36","0.65","0.65","0.38","0.71","0.71","0.19","0.89","0.89","0.32","1.01","1.01","0.23","1.02","1.02","0.20","1.06","1.06","0.22","1.16","1.16","0.40","1.17","1.17","0.41","1.16","1.16","0.32","1.23","1.23","0.41","1.00","1.00","0.51","1.10","1.10","0.50","0.99","0.99","0.54","1.20","1.20","0.60","0.97","0.97","0.60","0.94","0.94","0.72","0.99","0.99","0.59","0.91","0.91","0.60","0.63","0.63","0.43","0.39","0.39","0.28","0.25","0.25","0.11","0.13","0.13","0.12","0.07","0.07","0.10","0.14","0.14"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/laye
r_2_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_output
_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_ou
tput_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_in
termediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer
_23_output_dense.png"],"x":[0.5833333333333334,0.75,0.9166666666666667,1.5833333333333333,1.75,1.9166666666666665,2.5833333333333335,2.75,2.916666666666667,3.5833333333333335,3.75,3.916666666666667,4.583333333333333,4.75,4.916666666666666,5.583333333333333,5.75,5.916666666666666,6.583333333333333,6.75,6.916666666666666,7.583333333333333,7.75,7.916666666666666,8.583333333333334,8.75,8.916666666666668,9.583333333333334,9.75,9.916666666666668,10.583333333333334,10.75,10.916666666666668,11.583333333333334,11.75,11.916666666666668,12.583333333333334,12.75,12.916666666666668,13.583333333333334,13.75,13.916666666666668,14.583333333333334,14.75,14.916666666666668,15.583333333333334,15.75,15.916666666666668,16.583333333333332,16.75,16.916666666666664,17.583333333333332,17.75,17.916666666666664,18.583333333333332,18.75,18.916666666666664,19.583333333333332,19.75,19.916666666666664,20.583333333333332,20.75,20.916666666666664,21.583333333333332,21.75,21.916666666666664,22.583333333333332,22.75,22.916666666666664,23.583333333333332,23.75,23.916666666666664]},"selected":{"id":"1156"},"selection_policy":{"id":"1157"}},"id":"1134","type":"ColumnDataSource"},{"attributes":{"fill_color":{"value":"#aa69f7"},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1136","type":"VBar"},{"attributes":{},"id":"1149","type":"BasicTickFormatter"},{"attributes":{"items":[{"id":"1141"},{"id":"1142"},{"id":"1143"},{"id":"1144"}],"location":[10,0],"orientation":"horizontal"},"id":"1140","type":"Legend"},{"attributes":{},"id":"1151","type":"UnionRenderers"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#aa69f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1137","type":"VBar"},{"attributes":{},"id":"1152","type":"Selection"},{"attributes":{"source":{"id":"1134"}},"id":"1139","type":"CDSView"},{"attributes":{"label":{"value":"query"},"render
ers":[{"id":"1120"}]},"id":"1141","type":"LegendItem"},{"attributes":{"label":{"value":"fully connected"},"renderers":[{"id":"1138"}]},"id":"1144","type":"LegendItem"},{"attributes":{"label":{"value":"key"},"renderers":[{"id":"1126"}]},"id":"1142","type":"LegendItem"},{"attributes":{"data_source":{"id":"1116"},"glyph":{"id":"1118"},"hover_glyph":null,"muted_glyph":null,"name":"query","nonselection_glyph":{"id":"1119"},"selection_glyph":null,"view":{"id":"1121"}},"id":"1120","type":"GlyphRenderer"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#6573f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1119","type":"VBar"},{"attributes":{"above":[{"id":"1140"}],"below":[{"id":"1106"}],"center":[{"id":"1109"},{"id":"1113"}],"left":[{"id":"1110"}],"outline_line_color":null,"plot_height":300,"plot_width":505,"renderers":[{"id":"1120"},{"id":"1126"},{"id":"1132"},{"id":"1138"}],"title":{"id":"1096"},"toolbar":{"id":"1114"},"x_range":{"id":"1098"},"x_scale":{"id":"1102"},"y_range":{"id":"1100"},"y_scale":{"id":"1104"}},"id":"1095","subtype":"Figure","type":"Plot"},{"attributes":{"label":{"value":"value"},"renderers":[{"id":"1132"}]},"id":"1143","type":"LegendItem"},{"attributes":{},"id":"1156","type":"Selection"},{"attributes":{"data":{"density":["30.3%","39.0%","18.8%","25.1%","19.0%","17.0%","18.0%","34.7%","45.3%","37.1%","43.1%","52.2%","48.8%","50.2%","61.6%","64.0%","72.0%","56.8%","67.5%","58.5%","47.3%","18.1%","17.1%","13.7%"],"height":[0.31744,0.408576,0.197632,0.263168,0.19968,0.178176,0.188416,0.36352,0.475136,0.38912,0.451584,0.54784,0.512,0.526336,0.646144,0.67072,0.754688,0.595968,0.707584,0.613376,0.495616,0.18944,0.1792,0.14336],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","
128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.query","1.attention.query","2.attention.query","3.attention.query","4.attention.query","5.attention.query","6.attention.query","7.attention.query","8.attention.query","9.attention.query","10.attention.query","11.attention.query","12.attention.query","13.attention.query","14.attention.query","15.attention.query","16.attention.query","17.attention.query","18.attention.query","19.attention.query","20.attention.query","21.attention.query","22.attention.query","23.attention.query"],"parameters":["0.32","0.41","0.20","0.26","0.20","0.18","0.19","0.36","0.48","0.39","0.45","0.55","0.51","0.53","0.65","0.67","0.75","0.60","0.71","0.61","0.50","0.19","0.18","0.14"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attent
ion_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_query.png"],"x":[0.08333333333333333,1.0833333333333333,2.08333333333333
35,3.0833333333333335,4.083333333333333,5.083333333333333,6.083333333333333,7.083333333333333,8.083333333333334,9.083333333333334,10.083333333333334,11.083333333333334,12.083333333333334,13.083333333333334,14.083333333333334,15.083333333333334,16.083333333333332,17.083333333333332,18.083333333333332,19.083333333333332,20.083333333333332,21.083333333333332,22.083333333333332,23.083333333333332]},"selected":{"id":"1150"},"selection_policy":{"id":"1151"}},"id":"1116","type":"ColumnDataSource"}],"root_ids":["1095"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
- var render_items = [{"docid":"f56a7c28-6e1b-4927-93b9-4555a3be5feb","root_ids":["1095"],"roots":{"1095":"a85caee3-4b94-4040-a1fc-e7d48dee0140"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
16
 
17
 
18
 
19
+ var element = document.getElementById("1debdd41-fd37-4bdc-9680-8b9c19589d73");
20
  if (element == null) {
21
+ console.warn("Bokeh: autoload.js configured with elementid '1debdd41-fd37-4bdc-9680-8b9c19589d73' but no matching script tag was found.")
22
  }
23
 
24
 
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
+ var docs_json = '{"53909e90-a81a-4854-9fa2-512475f1322d":{"roots":{"references":[{"attributes":{"axis_label":"Parameters (M)","formatter":{"id":"1146"},"minor_tick_line_color":null,"ticker":{"id":"1111"}},"id":"1110","type":"LinearAxis"},{"attributes":{},"id":"1104","type":"LinearScale"},{"attributes":{},"id":"1157","type":"UnionRenderers"},{"attributes":{},"id":"1098","type":"DataRange1d"},{"attributes":{"fill_color":{"value":"#20cb97"},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1130","type":"VBar"},{"attributes":{},"id":"1102","type":"LinearScale"},{"attributes":{"axis_label":"Layer","formatter":{"id":"1148"},"minor_tick_line_color":null,"ticker":{"id":"1107"}},"id":"1106","type":"LinearAxis"},{"attributes":{},"id":"1156","type":"Selection"},{"attributes":{},"id":"1107","type":"BasicTicker"},{"attributes":{"label":{"value":"value"},"renderers":[{"id":"1132"}]},"id":"1143","type":"LegendItem"},{"attributes":{"fill_color":{"value":"#6573f7"},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1118","type":"VBar"},{"attributes":{"source":{"id":"1116"}},"id":"1121","type":"CDSView"},{"attributes":{},"id":"1155","type":"UnionRenderers"},{"attributes":{"axis":{"id":"1106"},"grid_line_color":null,"ticker":null},"id":"1109","type":"Grid"},{"attributes":{},"id":"1152","type":"Selection"},{"attributes":{},"id":"1154","type":"Selection"},{"attributes":{"items":[{"id":"1141"},{"id":"1142"},{"id":"1143"},{"id":"1144"}],"location":[10,0],"orientation":"horizontal"},"id":"1140","type":"Legend"},{"attributes":{"axis":{"id":"1110"},"dimension":1,"ticker":null},"id":"1113","type":"Grid"},{"attributes":{"data_source":{"id":"1134"},"glyph":{"id":"1136"},"hover_glyph":null,"muted_glyph":null,"name":"fully 
connected","nonselection_glyph":{"id":"1137"},"selection_glyph":null,"view":{"id":"1139"}},"id":"1138","type":"GlyphRenderer"},{"attributes":{"data_source":{"id":"1122"},"glyph":{"id":"1124"},"hover_glyph":null,"muted_glyph":null,"name":"key","nonselection_glyph":{"id":"1125"},"selection_glyph":null,"view":{"id":"1127"}},"id":"1126","type":"GlyphRenderer"},{"attributes":{},"id":"1148","type":"BasicTickFormatter"},{"attributes":{"above":[{"id":"1140"}],"below":[{"id":"1106"}],"center":[{"id":"1109"},{"id":"1113"}],"left":[{"id":"1110"}],"outline_line_color":null,"plot_height":300,"plot_width":505,"renderers":[{"id":"1120"},{"id":"1126"},{"id":"1132"},{"id":"1138"}],"title":{"id":"1096"},"toolbar":{"id":"1114"},"x_range":{"id":"1098"},"x_scale":{"id":"1102"},"y_range":{"id":"1100"},"y_scale":{"id":"1104"}},"id":"1095","subtype":"Figure","type":"Plot"},{"attributes":{"data_source":{"id":"1128"},"glyph":{"id":"1130"},"hover_glyph":null,"muted_glyph":null,"name":"value","nonselection_glyph":{"id":"1131"},"selection_glyph":null,"view":{"id":"1133"}},"id":"1132","type":"GlyphRenderer"},{"attributes":{"fill_color":{"value":"#ed5642"},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1124","type":"VBar"},{"attributes":{"fill_color":{"value":"#aa69f7"},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1136","type":"VBar"},{"attributes":{},"id":"1146","type":"BasicTickFormatter"},{"attributes":{"data":{"density":["30.3%","39.0%","18.8%","25.1%","19.0%","17.0%","18.0%","34.7%","45.3%","37.1%","43.1%","52.2%","48.8%","50.2%","61.6%","64.0%","72.0%","56.8%","67.5%","58.5%","47.3%","18.1%","17.1%","13.7%"],"height":[0.31744,0.408576,0.197632,0.263168,0.19968,0.178176,0.188416,0.36352,0.475136,0.38912,0.451584,0.54784,0.512,0.526336,0.646144,0.67072,0.754688,0.595968,0.707584,0.613376,0.495616,0.18944,0.1792,0.14336],"img_height":["128px","128px","128px","128px","128px"
,"128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.query","1.attention.query","2.attention.query","3.attention.query","4.attention.query","5.attention.query","6.attention.query","7.attention.query","8.attention.query","9.attention.query","10.attention.query","11.attention.query","12.attention.query","13.attention.query","14.attention.query","15.attention.query","16.attention.query","17.attention.query","18.attention.query","19.attention.query","20.attention.query","21.attention.query","22.attention.query","23.attention.query"],"parameters":["0.32","0.41","0.20","0.26","0.20","0.18","0.19","0.36","0.48","0.39","0.45","0.55","0.51","0.53","0.65","0.67","0.75","0.60","0.71","0.61","0.50","0.19","0.18","0.14"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hy
brid-v1/raw/main/model_card/images/layer_7_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_query.png","/madlag/bert
-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_query.png"],"x":[0.08333333333333333,1.0833333333333333,2.0833333333333335,3.0833333333333335,4.083333333333333,5.083333333333333,6.083333333333333,7.083333333333333,8.083333333333334,9.083333333333334,10.083333333333334,11.083333333333334,12.083333333333334,13.083333333333334,14.083333333333334,15.083333333333334,16.083333333333332,17.083333333333332,18.083333333333332,19.083333333333332,20.083333333333332,21.083333333333332,22.083333333333332,23.083333333333332]},"selected":{"id":"1150"},"selection_policy":{"id":"1151"}},"id":"1116","type":"ColumnDataSource"},{"attributes":{"label":{"value":"key"},"renderers":[{"id":"1126"}]},"id":"1142","type":"LegendItem"},{"attributes":{},"id":"1151","type":"UnionRenderers"},{"attributes":{},"id":"1111","type":"BasicTicker"},{"attributes":{"callback":null,"tooltips":"\\n &lt;div&gt;\\n &lt;div style=\\"margin-bottom:10px\\"&gt;\\n &lt;span style=\\"font-size: 15px;\\"&gt;&lt;b&gt;@name&lt;/b&gt;&lt;br/&gt;density=@density&lt;/span&gt;\\n &lt;/div&gt;\\n &lt;div&gt; \\n &lt;img\\n src=\\"@url\\" height=\\"@img_height\\" width=\\"@img_width\\" alt=\\"@url\\"\\n style=\\"float: left; margin: 0px 15px 15px 0px;\\"\\n border=\\"0\\"\\n /&gt;\\n &lt;/div&gt;\\n &lt;/div&gt;\\n 
"},"id":"1094","type":"HoverTool"},{"attributes":{"data":{"density":["30.3%","37.9%","19.5%","28.4%","20.3%","16.8%","19.9%","35.0%","47.9%","36.4%","43.8%","53.8%","51.2%","50.8%","64.3%","64.9%","76.3%","58.7%","68.7%","60.3%","45.8%","17.2%","17.4%","15.8%"],"height":[0.31744,0.397312,0.2048,0.297984,0.212992,0.176128,0.208896,0.366592,0.50176,0.381952,0.458752,0.564224,0.536576,0.53248,0.673792,0.68096,0.799744,0.615424,0.719872,0.631808,0.480256,0.180224,0.182272,0.165888],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.key","1.attention.key","2.attention.key","3.attention.key","4.attention.key","5.attention.key","6.attention.key","7.attention.key","8.attention.key","9.attention.key","10.attention.key","11.attention.key","12.attention.key","13.attention.key","14.attention.key","15.attention.key","16.attention.key","17.attention.key","18.attention.key","19.attention.key","20.attention.key","21.attention.key","22.attention.key","23.attention.key"],"parameters":["0.32","0.40","0.20","0.30","0.21","0.18","0.21","0.37","0.50","0.38","0.46","0.56","0.54","0.53","0.67","0.68","0.80","0.62","0.72","0.63","0.48","0.18","0.18","0.17"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_car
d/images/layer_3_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/
model_card/images/layer_19_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_key.png"],"x":[0.25,1.25,2.25,3.25,4.25,5.25,6.25,7.25,8.25,9.25,10.25,11.25,12.25,13.25,14.25,15.25,16.25,17.25,18.25,19.25,20.25,21.25,22.25,23.25]},"selected":{"id":"1152"},"selection_policy":{"id":"1153"}},"id":"1122","type":"ColumnDataSource"},{"attributes":{"source":{"id":"1128"}},"id":"1133","type":"CDSView"},{"attributes":{},"id":"1150","type":"Selection"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#aa69f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1137","type":"VBar"},{"attributes":{"source":{"id":"1134"}},"id":"1139","type":"CDSView"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#20cb97"},"line_alpha":{"value":0.1},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1131","type":"VBar"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto","tools":[{"id":"1094"}]},"id":"1114","type":"Toolbar"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#6573f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1119","type":"VBar"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#ed5642"},"line_alpha":{"value":0.1},"line_color":{"value":"#ed5642"},"top":{"field":
"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1125","type":"VBar"},{"attributes":{"start":0},"id":"1100","type":"DataRange1d"},{"attributes":{"label":{"value":"fully connected"},"renderers":[{"id":"1138"}]},"id":"1144","type":"LegendItem"},{"attributes":{"data":{"density":["31.8%","34.0%","16.4%","26.9%","18.8%","17.6%","19.4%","35.4%","37.8%","28.7%","37.6%","44.5%","44.5%","50.7%","54.0%","54.1%","68.5%","54.7%","57.3%","43.8%","27.6%","12.1%","13.0%","11.2%"],"height":[0.333824,0.356352,0.172032,0.2816,0.196608,0.18432,0.203776,0.371712,0.396288,0.301056,0.39424,0.466944,0.466944,0.531456,0.566272,0.567296,0.717824,0.57344,0.601088,0.458752,0.289792,0.126976,0.136192,0.11776],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.value","1.attention.value","2.attention.value","3.attention.value","4.attention.value","5.attention.value","6.attention.value","7.attention.value","8.attention.value","9.attention.value","10.attention.value","11.attention.value","12.attention.value","13.attention.value","14.attention.value","15.attention.value","16.attention.value","17.attention.value","18.attention.value","19.attention.value","20.attention.value","21.attention.value","22.attention.value","23.attention.value"],"parameters":["0.33","0.36","0.17","0.28","0.20","0.18","0.20","0.37","0.40","0.30","0.39","0.47","0.47","0.53","0.57","0.57","0.72","0.57","0.60","0.46","0.29","0.13","0.14","0.12"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/
raw/main/model_card/images/layer_1_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_value.png","/madlag/bert-large-uncased
-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_value.png"],"x":[0.41666666666666663,1.4166666666666665,2.416666666666667,3.416666666666667,4.416666666666666,5.416666666666666,6.416666666666666,7.416666666666666,8.416666666666668,9.416666666666668,10.416666666666668,11.416666666666668,12.416666666666668,13.416666666666668,14.416666666666668,15.416666666666668,16.416666666666664,17.416666666666664,18.416666666666664,19.416666666666664,20.416666666666664,21.416666666666664,22.416666666666664,23.416666666666664]},"selected":{"id":"1154"},"selection_policy":{"id":"1155"}},"id":"1128","type":"ColumnDataSource"},{"attributes":{"text":"Transformer 
Layers"},"id":"1096","type":"Title"},{"attributes":{},"id":"1153","type":"UnionRenderers"},{"attributes":{"source":{"id":"1122"}},"id":"1127","type":"CDSView"},{"attributes":{"data_source":{"id":"1116"},"glyph":{"id":"1118"},"hover_glyph":null,"muted_glyph":null,"name":"query","nonselection_glyph":{"id":"1119"},"selection_glyph":null,"view":{"id":"1121"}},"id":"1120","type":"GlyphRenderer"},{"attributes":{"data":{"density":["34.4%","15.4%","15.4%","35.9%","17.0%","17.0%","17.9%","21.2%","21.2%","30.7%","24.2%","24.2%","21.6%","24.3%","24.3%","18.7%","25.3%","25.3%","20.5%","27.6%","27.6%","38.3%","27.9%","27.9%","39.3%","27.8%","27.8%","31.0%","29.4%","29.4%","39.5%","23.7%","23.7%","48.8%","26.3%","26.3%","47.3%","23.7%","23.7%","51.8%","28.5%","28.5%","57.6%","23.1%","23.1%","56.9%","22.3%","22.3%","68.9%","23.7%","23.7%","56.2%","21.7%","21.7%","57.2%","15.0%","15.0%","41.1%","9.3%","9.3%","26.7%","6.1%","6.1%","10.6%","3.1%","3.1%","11.4%","1.8%","1.8%","9.6%","3.4%","3.4%"],"height":[0.360448,0.647168,0.647168,0.376832,0.714752,0.714752,0.187392,0.887808,0.887808,0.321536,1.01376,1.01376,0.226304,1.017856,1.017856,0.195584,1.061888,1.061888,0.21504,1.156096,1.156096,0.401408,1.169408,1.169408,0.411648,1.164288,1.164288,0.324608,1.231872,1.231872,0.413696,0.995328,0.995328,0.512,1.103872,1.103872,0.495616,0.994304,0.994304,0.54272,1.196032,1.196032,0.60416,0.970752,0.970752,0.596992,0.93696,0.93696,0.722944,0.992256,0.992256,0.5888,0.910336,0.910336,0.600064,0.62976,0.62976,0.431104,0.388096,0.388096,0.279552,0.253952,0.253952,0.111616,0.130048,0.130048,0.119808,0.074752,0.074752,0.100352,0.142336,0.142336],"img_height":["128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","51
2px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px"],"img_width":["128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px"],"name":["0.attention.output","0.intermediate","0.output","1.attention.output","1.intermediate","1.output","2.attention.output","2.intermediate","2.output","3.attention.output","3.intermediate","3.output","4.attention.output","4.intermediate","4.output","5.attention.output","5.intermediate","5.output","6.attention.output","6.intermediate","6.output","7.attention.output","7.intermediate","7.output","8.attention.output","8.intermediate","8.output","9.attention.output","9.intermediate","9.output","10.attention.output","10.intermediate","10.output","11.attention.output","11.intermediate","11.output","12.attention.output","12.intermediate","12.output","13.attention.output","13.intermediate","13.output","14.attention.output","14.intermediate","14.output","15.attention.output","15.intermediate","15.output","16.attention.output","16.intermediate","16.output","17.attention.output","17.intermediate","17.output","18.attention.output","18.intermediate","18.output","19.attention.output","19.intermediate","19.output","20.attention.output","20.intermediate","20.output","21.attention.output","21.intermediate","21.output","22.attention.output","22.intermediate","22.output","23.at
tention.output","23.intermediate","23.output"],"parameters":["0.36","0.65","0.65","0.38","0.71","0.71","0.19","0.89","0.89","0.32","1.01","1.01","0.23","1.02","1.02","0.20","1.06","1.06","0.22","1.16","1.16","0.40","1.17","1.17","0.41","1.16","1.16","0.32","1.23","1.23","0.41","1.00","1.00","0.51","1.10","1.10","0.50","0.99","0.99","0.54","1.20","1.20","0.60","0.97","0.97","0.60","0.94","0.94","0.72","0.99","0.99","0.59","0.91","0.91","0.60","0.63","0.63","0.43","0.39","0.39","0.28","0.25","0.25","0.11","0.13","0.13","0.12","0.07","0.07","0.10","0.14","0.14"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_0_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_1_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_2_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_3_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d2
5-hybrid-v1/raw/main/model_card/images/layer_3_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_4_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_5_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_6_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_7_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_8_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/
main/model_card/images/layer_9_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_9_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_10_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_11_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_12_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_13_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-
v1/raw/main/model_card/images/layer_14_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_14_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_15_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_16_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_17_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_18_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_19_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-h
ybrid-v1/raw/main/model_card/images/layer_19_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_20_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_21_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_22_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.15-f83.2-d25-hybrid-v1/raw/main/model_card/images/layer_23_output_dense.png"],"x":[0.5833333333333334,0.75,0.9166666666666667,1.5833333333333333,1.75,1.9166666666666665,2.5833333333333335,2.75,2.916666666666667,3.5833333333333335,3.75,3.916666666666667,4.583333333333333,4.75,4.916666666666666,5.583333333333333,5.75,5.916666666666666,6.583333333333333,6.75,6.916666666666666,7.583333333333333,7.75,7.916666666666666,8.583333333333334,8.75,8.916666666666668,9.583333333333334,9.75,9.916666666666668,10.58333333
3333334,10.75,10.916666666666668,11.583333333333334,11.75,11.916666666666668,12.583333333333334,12.75,12.916666666666668,13.583333333333334,13.75,13.916666666666668,14.583333333333334,14.75,14.916666666666668,15.583333333333334,15.75,15.916666666666668,16.583333333333332,16.75,16.916666666666664,17.583333333333332,17.75,17.916666666666664,18.583333333333332,18.75,18.916666666666664,19.583333333333332,19.75,19.916666666666664,20.583333333333332,20.75,20.916666666666664,21.583333333333332,21.75,21.916666666666664,22.583333333333332,22.75,22.916666666666664,23.583333333333332,23.75,23.916666666666664]},"selected":{"id":"1156"},"selection_policy":{"id":"1157"}},"id":"1134","type":"ColumnDataSource"},{"attributes":{"label":{"value":"query"},"renderers":[{"id":"1120"}]},"id":"1141","type":"LegendItem"}],"root_ids":["1095"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
+ var render_items = [{"docid":"53909e90-a81a-4854-9fa2-512475f1322d","root_ids":["1095"],"roots":{"1095":"1debdd41-fd37-4bdc-9680-8b9c19589d73"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
model_card/pruning_info.js CHANGED
@@ -16,9 +16,9 @@
16
 
17
 
18
 
19
- var element = document.getElementById("28643677-244b-48fb-940c-10f2831ab74e");
20
  if (element == null) {
21
- console.warn("Bokeh: autoload.js configured with elementid '28643677-244b-48fb-940c-10f2831ab74e' but no matching script tag was found.")
22
  }
23
 
24
 
@@ -115,8 +115,8 @@
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
- var docs_json = '{"a16af632-a774-4f60-b023-478254f862f1":{"roots":{"references":[{"attributes":{"start":0},"id":"1006","type":"DataRange1d"},{"attributes":{},"id":"1008","type":"CategoricalScale"},{"attributes":{"axis":{"id":"1012"},"grid_line_color":null,"ticker":null},"id":"1014","type":"Grid"},{"attributes":{"factors":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"range_padding":0.1},"id":"1004","type":"FactorRange"},{"attributes":{"above":[{"id":"1055"}],"below":[{"id":"1012"}],"center":[{"id":"1014"},{"id":"1018"},{"id":"1037"}],"left":[{"id":"1015"}],"outline_line_color":null,"plot_height":400,"renderers":[{"id":"1028"},{"id":"1043"}],"title":{"id":"1002"},"toolbar":{"id":"1019"},"toolbar_location":null,"x_range":{"id":"1004"},"x_scale":{"id":"1008"},"y_range":{"id":"1006"},"y_scale":{"id":"1010"}},"id":"1001","subtype":"Figure","type":"Plot"},{"attributes":{"items":[{"id":"1056"},{"id":"1057"}],"location":[10,0],"orientation":"horizontal"},"id":"1055","type":"Legend"},{"attributes":{"fields":[]},"id":"1020","type":"Stack"},{"attributes":{},"id":"1052","type":"Selection"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1038","type":"LegendItem"},{"attributes":{},"id":"1053","type":"UnionRenderers"},{"attributes":{},"id":"1032","type":"BasicTickFormatter"},{"attributes":{},"id":"1035","type":"Selection"},{"attributes":{},"id":"1010","type":"LinearScale"},{"attributes":{},"id":"1036","type":"UnionRenderers"},{"attributes":{"text":"Pruned Transformer 
Heads"},"id":"1002","type":"Title"},{"attributes":{},"id":"1034","type":"CategoricalTickFormatter"},{"attributes":{"data":{"active":[9,9,4,6,5,5,4,8,9,8,8,10,11,10,14,14,16,13,14,15,13,7,8,9],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[7,7,12,10,11,11,12,8,7,8,8,6,5,6,2,2,0,3,2,1,3,9,8,7]},"selected":{"id":"1052"},"selection_policy":{"id":"1053"}},"id":"1039","type":"ColumnDataSource"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1056","type":"LegendItem"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1057","type":"LegendItem"},{"attributes":{"fields":["active"]},"id":"1021","type":"Stack"},{"attributes":{"source":{"id":"1039"}},"id":"1044","type":"CDSView"},{"attributes":{"axis":{"id":"1015"},"dimension":1,"ticker":null},"id":"1018","type":"Grid"},{"attributes":{},"id":"1016","type":"BasicTicker"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_color":{"value":"#ffcccc"},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1041","type":"VBar"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1054","type":"LegendItem"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#ffcccc"},"line_alpha":{"value":0.1},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1042","type":"VBar"},{"attributes":{"data":{"active":[9,9,4,6,5,5,4,8,9,8,8,10,11,10,14,14,16,13,14,15,13,7,8,9],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[7,7,12,10,11,11,12,8,7,8,8,6,5,6,2,2,0,3,2,1,3,9,8,7]},"selected":{"id":"1035"},"selection_policy":{"id":"1036"}},"id":"1024","type":"ColumnDataSource"},{"attributes":{"axis_label":"Heads 
count","formatter":{"id":"1032"},"minor_tick_line_color":null,"ticker":{"id":"1016"}},"id":"1015","type":"LinearAxis"},{"attributes":{"data_source":{"id":"1039"},"glyph":{"id":"1041"},"hover_glyph":null,"muted_glyph":null,"name":"pruned","nonselection_glyph":{"id":"1042"},"selection_glyph":null,"view":{"id":"1044"}},"id":"1043","type":"GlyphRenderer"},{"attributes":{"fields":["active","pruned"]},"id":"1023","type":"Stack"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto"},"id":"1019","type":"Toolbar"},{"attributes":{"source":{"id":"1024"}},"id":"1029","type":"CDSView"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_color":{"value":"#0000ff"},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1026","type":"VBar"},{"attributes":{"fields":["active"]},"id":"1022","type":"Stack"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#0000ff"},"line_alpha":{"value":0.1},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1027","type":"VBar"},{"attributes":{"items":[{"id":"1038"},{"id":"1054"}],"location":null},"id":"1037","type":"Legend"},{"attributes":{},"id":"1013","type":"CategoricalTicker"},{"attributes":{"data_source":{"id":"1024"},"glyph":{"id":"1026"},"hover_glyph":null,"muted_glyph":null,"name":"active","nonselection_glyph":{"id":"1027"},"selection_glyph":null,"view":{"id":"1029"}},"id":"1028","type":"GlyphRenderer"},{"attributes":{"axis_label":"Layer index","formatter":{"id":"1034"},"minor_tick_line_color":null,"ticker":{"id":"1013"}},"id":"1012","type":"CategoricalAxis"}],"root_ids":["1001"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
- var render_items = [{"docid":"a16af632-a774-4f60-b023-478254f862f1","root_ids":["1001"],"roots":{"1001":"28643677-244b-48fb-940c-10f2831ab74e"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
16
 
17
 
18
 
19
+ var element = document.getElementById("275e9fa1-bc94-4a73-a36c-e250fd7810ec");
20
  if (element == null) {
21
+ console.warn("Bokeh: autoload.js configured with elementid '275e9fa1-bc94-4a73-a36c-e250fd7810ec' but no matching script tag was found.")
22
  }
23
 
24
 
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
+ var docs_json = '{"701239e5-a951-4da6-bd5b-ad008f0dba23":{"roots":{"references":[{"attributes":{"start":0},"id":"1006","type":"DataRange1d"},{"attributes":{},"id":"1036","type":"UnionRenderers"},{"attributes":{},"id":"1008","type":"CategoricalScale"},{"attributes":{"axis":{"id":"1012"},"grid_line_color":null,"ticker":null},"id":"1014","type":"Grid"},{"attributes":{"factors":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"range_padding":0.1},"id":"1004","type":"FactorRange"},{"attributes":{"above":[{"id":"1055"}],"below":[{"id":"1012"}],"center":[{"id":"1014"},{"id":"1018"},{"id":"1037"}],"left":[{"id":"1015"}],"outline_line_color":null,"plot_height":400,"renderers":[{"id":"1028"},{"id":"1043"}],"title":{"id":"1002"},"toolbar":{"id":"1019"},"toolbar_location":null,"x_range":{"id":"1004"},"x_scale":{"id":"1008"},"y_range":{"id":"1006"},"y_scale":{"id":"1010"}},"id":"1001","subtype":"Figure","type":"Plot"},{"attributes":{"items":[{"id":"1056"},{"id":"1057"}],"location":[10,0],"orientation":"horizontal"},"id":"1055","type":"Legend"},{"attributes":{},"id":"1031","type":"BasicTickFormatter"},{"attributes":{"fields":[]},"id":"1020","type":"Stack"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1038","type":"LegendItem"},{"attributes":{},"id":"1010","type":"LinearScale"},{"attributes":{"text":"Pruned Transformer 
Heads"},"id":"1002","type":"Title"},{"attributes":{},"id":"1033","type":"CategoricalTickFormatter"},{"attributes":{},"id":"1035","type":"Selection"},{"attributes":{"data":{"active":[9,9,4,6,5,5,4,8,9,8,8,10,11,10,14,14,16,13,14,15,13,7,8,9],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[7,7,12,10,11,11,12,8,7,8,8,6,5,6,2,2,0,3,2,1,3,9,8,7]},"selected":{"id":"1052"},"selection_policy":{"id":"1053"}},"id":"1039","type":"ColumnDataSource"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1056","type":"LegendItem"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1057","type":"LegendItem"},{"attributes":{"fields":["active"]},"id":"1021","type":"Stack"},{"attributes":{"source":{"id":"1039"}},"id":"1044","type":"CDSView"},{"attributes":{"axis":{"id":"1015"},"dimension":1,"ticker":null},"id":"1018","type":"Grid"},{"attributes":{},"id":"1016","type":"BasicTicker"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_color":{"value":"#ffcccc"},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1041","type":"VBar"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1054","type":"LegendItem"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#ffcccc"},"line_alpha":{"value":0.1},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1042","type":"VBar"},{"attributes":{"data":{"active":[9,9,4,6,5,5,4,8,9,8,8,10,11,10,14,14,16,13,14,15,13,7,8,9],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[7,7,12,10,11,11,12,8,7,8,8,6,5,6,2,2,0,3,2,1,3,9,8,7]},"selected":{"id":"1035"},"selection_policy":{"id":"1036"}},"id":"1024","type":"ColumnDataSource"},{"attributes":{"axis_label"
:"Heads count","formatter":{"id":"1031"},"minor_tick_line_color":null,"ticker":{"id":"1016"}},"id":"1015","type":"LinearAxis"},{"attributes":{"data_source":{"id":"1039"},"glyph":{"id":"1041"},"hover_glyph":null,"muted_glyph":null,"name":"pruned","nonselection_glyph":{"id":"1042"},"selection_glyph":null,"view":{"id":"1044"}},"id":"1043","type":"GlyphRenderer"},{"attributes":{"fields":["active","pruned"]},"id":"1023","type":"Stack"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto"},"id":"1019","type":"Toolbar"},{"attributes":{"source":{"id":"1024"}},"id":"1029","type":"CDSView"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_color":{"value":"#0000ff"},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1026","type":"VBar"},{"attributes":{},"id":"1052","type":"Selection"},{"attributes":{"fields":["active"]},"id":"1022","type":"Stack"},{"attributes":{},"id":"1053","type":"UnionRenderers"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#0000ff"},"line_alpha":{"value":0.1},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1027","type":"VBar"},{"attributes":{"items":[{"id":"1038"},{"id":"1054"}],"location":null},"id":"1037","type":"Legend"},{"attributes":{},"id":"1013","type":"CategoricalTicker"},{"attributes":{"data_source":{"id":"1024"},"glyph":{"id":"1026"},"hover_glyph":null,"muted_glyph":null,"name":"active","nonselection_glyph":{"id":"1027"},"selection_glyph":null,"view":{"id":"1029"}},"id":"1028","type":"GlyphRenderer"},{"attributes":{"axis_label":"Layer index","formatter":{"id":"1033"},"minor_tick_line_color":null,"ticker":{"id":"1013"}},"id":"1012","type":"CategoricalAxis"}],"root_ids":["1001"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
+ var render_items = [{"docid":"701239e5-a951-4da6-bd5b-ad008f0dba23","root_ids":["1001"],"roots":{"1001":"275e9fa1-bc94-4a73-a36c-e250fd7810ec"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
model_info.json ADDED
@@ -0,0 +1,464 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint_path": "/data_2to/devel_data/nn_pruning/output/squadv2_test_3/hp_mnop-bert-large-uncased-whole-word-masking_dn-squad_v2_v2wn1_od-__data_2to__devel_data__nn_pruning__output__squadv2_test_3___es-steps_pdtbs8_pdebs128_nte20.06_ls250_stl50_est5000_--128cd5d9b5683065/checkpoint-330000",
3
+ "config": {
4
+ "_name_or_path": "/tmp/tmpxe9vb3vd",
5
+ "architectures": ["BertForQuestionAnswering"],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "gradient_checkpointing": false,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 1024,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 4096,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "bert",
16
+ "num_attention_heads": 16,
17
+ "num_hidden_layers": 24,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "pruned_heads": {
21
+ "0": [0, 3, 4, 5, 9, 13, 15],
22
+ "1": [0, 1, 7, 9, 10, 13, 14],
23
+ "10": [1, 2, 4, 5, 6, 8, 11, 13],
24
+ "11": [2, 5, 6, 8, 12, 15],
25
+ "12": [0, 2, 6, 9, 13],
26
+ "13": [2, 3, 6, 10, 12, 15],
27
+ "14": [10, 5],
28
+ "15": [0, 9],
29
+ "16": [],
30
+ "17": [1, 4, 12],
31
+ "18": [11, 4],
32
+ "19": [5],
33
+ "2": [0, 1, 4, 6, 7, 8, 9, 11, 12, 13, 14, 15],
34
+ "20": [0, 1, 12],
35
+ "21": [0, 2, 3, 4, 8, 10, 11, 12, 15],
36
+ "22": [0, 1, 3, 7, 9, 10, 11, 13],
37
+ "23": [2, 4, 7, 8, 9, 10, 13],
38
+ "3": [0, 3, 5, 6, 7, 8, 9, 13, 14, 15],
39
+ "4": [0, 2, 3, 5, 6, 7, 9, 10, 11, 12, 14],
40
+ "5": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15],
41
+ "6": [0, 1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 15],
42
+ "7": [3, 5, 8, 9, 10, 11, 12, 13],
43
+ "8": [3, 5, 7, 8, 9, 11, 12],
44
+ "9": [0, 1, 2, 5, 6, 7, 13, 14]
45
+ },
46
+ "transformers_version": "4.7.0.dev0",
47
+ "type_vocab_size": 2,
48
+ "use_cache": true,
49
+ "vocab_size": 30522
50
+ },
51
+ "eval_metrics": {
52
+ "HasAns_exact": 76.48448043184885,
53
+ "HasAns_f1": 82.55514100819374,
54
+ "HasAns_total": 5928,
55
+ "NoAns_exact": 83.8856181665265,
56
+ "NoAns_f1": 83.8856181665265,
57
+ "NoAns_total": 5945,
58
+ "best_exact": 80.19034784805862,
59
+ "best_exact_thresh": 0.0,
60
+ "best_f1": 83.22133208932635,
61
+ "best_f1_thresh": 0.0,
62
+ "exact": 80.19034784805862,
63
+ "f1": 83.22133208932645,
64
+ "main_metric": 83.22133208932645,
65
+ "total": 11873
66
+ },
67
+ "model_args": {
68
+ "cache_dir": null,
69
+ "config_name": null,
70
+ "model_name_or_path": "bert-large-uncased-whole-word-masking",
71
+ "tokenizer_name": null,
72
+ "use_fast_tokenizer": true
73
+ },
74
+ "sparse_args": {
75
+ "ampere_pruning_method": "disabled",
76
+ "attention_block_cols": 32,
77
+ "attention_block_rows": 32,
78
+ "attention_lambda": 1.0,
79
+ "attention_output_with_dense": 0,
80
+ "attention_pruning_method": "sigmoied_threshold",
81
+ "bias_mask": true,
82
+ "decoder_attention_lambda": null,
83
+ "decoder_dense_lambda": null,
84
+ "dense_block_cols": 1,
85
+ "dense_block_rows": 1,
86
+ "dense_lambda": 1.0,
87
+ "dense_pruning_method": "sigmoied_threshold:1d_alt",
88
+ "distil_alpha_ce": 0.1,
89
+ "distil_alpha_teacher": 0.9,
90
+ "distil_teacher_name_or_path": "madlag/bert-large-uncased-whole-word-masking-finetuned-squadv2",
91
+ "distil_temperature": 2.0,
92
+ "eval_with_current_patch_params": false,
93
+ "final_ampere_temperature": 20.0,
94
+ "final_finetune": false,
95
+ "final_threshold": 0.1,
96
+ "final_warmup": 10,
97
+ "gelu_patch": 0,
98
+ "gelu_patch_steps": 50000,
99
+ "initial_ampere_temperature": 0.0,
100
+ "initial_threshold": 0,
101
+ "initial_warmup": 1,
102
+ "layer_norm_patch": 0,
103
+ "layer_norm_patch_start_delta": 0.99,
104
+ "layer_norm_patch_steps": 50000,
105
+ "linear_min_parameters": 0.005,
106
+ "mask_init": "constant",
107
+ "mask_scale": 0.0,
108
+ "mask_scores_learning_rate": 0.01,
109
+ "qat": false,
110
+ "qconfig": "default",
111
+ "regularization": "l1",
112
+ "regularization_final_lambda": 2,
113
+ "rewind_model_name_or_path": null
114
+ },
115
+ "speed": {
116
+ "cuda_eval_elapsed_time": 63.65266278076172,
117
+ "eval_elapsed_time": 68.118653698
118
+ },
119
+ "speedup": 0.6933166669240776,
120
+ "stats": {
121
+ "layers": {
122
+ "0": {
123
+ "linear_attention_nnz": 1329152,
124
+ "linear_attention_total": 4194304,
125
+ "linear_dense_nnz": 1294336,
126
+ "linear_dense_total": 8388608,
127
+ "linear_nnz": 2623488,
128
+ "linear_total": 12582912,
129
+ "nnz": 2631960,
130
+ "total": 12594880
131
+ },
132
+ "1": {
133
+ "linear_attention_nnz": 1539072,
134
+ "linear_attention_total": 4194304,
135
+ "linear_dense_nnz": 1429504,
136
+ "linear_dense_total": 8388608,
137
+ "linear_nnz": 2968576,
138
+ "linear_total": 12582912,
139
+ "nnz": 2977018,
140
+ "total": 12594880
141
+ },
142
+ "10": {
143
+ "linear_attention_nnz": 1718272,
144
+ "linear_attention_total": 4194304,
145
+ "linear_dense_nnz": 1990656,
146
+ "linear_dense_total": 8388608,
147
+ "linear_nnz": 3708928,
148
+ "linear_total": 12582912,
149
+ "nnz": 3717580,
150
+ "total": 12594688
151
+ },
152
+ "11": {
153
+ "linear_attention_nnz": 2091008,
154
+ "linear_attention_total": 4194304,
155
+ "linear_dense_nnz": 2207744,
156
+ "linear_dense_total": 8388608,
157
+ "linear_nnz": 4298752,
158
+ "linear_total": 12582912,
159
+ "nnz": 4307894,
160
+ "total": 12595072
161
+ },
162
+ "12": {
163
+ "linear_attention_nnz": 2011136,
164
+ "linear_attention_total": 4194304,
165
+ "linear_dense_nnz": 1988608,
166
+ "linear_dense_total": 8388608,
167
+ "linear_nnz": 3999744,
168
+ "linear_total": 12582912,
169
+ "nnz": 4008939,
170
+ "total": 12595264
171
+ },
172
+ "13": {
173
+ "linear_attention_nnz": 2132992,
174
+ "linear_attention_total": 4194304,
175
+ "linear_dense_nnz": 2392064,
176
+ "linear_dense_total": 8388608,
177
+ "linear_nnz": 4525056,
178
+ "linear_total": 12582912,
179
+ "nnz": 4534288,
180
+ "total": 12595072
181
+ },
182
+ "14": {
183
+ "linear_attention_nnz": 2490368,
184
+ "linear_attention_total": 4194304,
185
+ "linear_dense_nnz": 1941504,
186
+ "linear_dense_total": 8388608,
187
+ "linear_nnz": 4431872,
188
+ "linear_total": 12582912,
189
+ "nnz": 4441620,
190
+ "total": 12595840
191
+ },
192
+ "15": {
193
+ "linear_attention_nnz": 2515968,
194
+ "linear_attention_total": 4194304,
195
+ "linear_dense_nnz": 1873920,
196
+ "linear_dense_total": 8388608,
197
+ "linear_nnz": 4389888,
198
+ "linear_total": 12582912,
199
+ "nnz": 4399635,
200
+ "total": 12595840
201
+ },
202
+ "16": {
203
+ "linear_attention_nnz": 2995200,
204
+ "linear_attention_total": 4194304,
205
+ "linear_dense_nnz": 1984512,
206
+ "linear_dense_total": 8388608,
207
+ "linear_nnz": 4979712,
208
+ "linear_total": 12582912,
209
+ "nnz": 4989801,
210
+ "total": 12596224
211
+ },
212
+ "17": {
213
+ "linear_attention_nnz": 2373632,
214
+ "linear_attention_total": 4194304,
215
+ "linear_dense_nnz": 1820672,
216
+ "linear_dense_total": 8388608,
217
+ "linear_nnz": 4194304,
218
+ "linear_total": 12582912,
219
+ "nnz": 4203737,
220
+ "total": 12595648
221
+ },
222
+ "18": {
223
+ "linear_attention_nnz": 2628608,
224
+ "linear_attention_total": 4194304,
225
+ "linear_dense_nnz": 1259520,
226
+ "linear_dense_total": 8388608,
227
+ "linear_nnz": 3888128,
228
+ "linear_total": 12582912,
229
+ "nnz": 3897575,
230
+ "total": 12595840
231
+ },
232
+ "19": {
233
+ "linear_attention_nnz": 2135040,
234
+ "linear_attention_total": 4194304,
235
+ "linear_dense_nnz": 776192,
236
+ "linear_dense_total": 8388608,
237
+ "linear_nnz": 2911232,
238
+ "linear_total": 12582912,
239
+ "nnz": 2920315,
240
+ "total": 12596032
241
+ },
242
+ "2": {
243
+ "linear_attention_nnz": 761856,
244
+ "linear_attention_total": 4194304,
245
+ "linear_dense_nnz": 1775616,
246
+ "linear_dense_total": 8388608,
247
+ "linear_nnz": 2537472,
248
+ "linear_total": 12582912,
249
+ "nnz": 2545251,
250
+ "total": 12593920
251
+ },
252
+ "20": {
253
+ "linear_attention_nnz": 1545216,
254
+ "linear_attention_total": 4194304,
255
+ "linear_dense_nnz": 507904,
256
+ "linear_dense_total": 8388608,
257
+ "linear_nnz": 2053120,
258
+ "linear_total": 12582912,
259
+ "nnz": 2061560,
260
+ "total": 12595648
261
+ },
262
+ "21": {
263
+ "linear_attention_nnz": 608256,
264
+ "linear_attention_total": 4194304,
265
+ "linear_dense_nnz": 260096,
266
+ "linear_dense_total": 8388608,
267
+ "linear_nnz": 868352,
268
+ "linear_total": 12582912,
269
+ "nnz": 875551,
270
+ "total": 12594496
271
+ },
272
+ "22": {
273
+ "linear_attention_nnz": 617472,
274
+ "linear_attention_total": 4194304,
275
+ "linear_dense_nnz": 149504,
276
+ "linear_dense_total": 8388608,
277
+ "linear_nnz": 766976,
278
+ "linear_total": 12582912,
279
+ "nnz": 774281,
280
+ "total": 12594688
281
+ },
282
+ "23": {
283
+ "linear_attention_nnz": 527360,
284
+ "linear_attention_total": 4194304,
285
+ "linear_dense_nnz": 284672,
286
+ "linear_dense_total": 8388608,
287
+ "linear_nnz": 812032,
288
+ "linear_total": 12582912,
289
+ "nnz": 819435,
290
+ "total": 12594880
291
+ },
292
+ "3": {
293
+ "linear_attention_nnz": 1164288,
294
+ "linear_attention_total": 4194304,
295
+ "linear_dense_nnz": 2027520,
296
+ "linear_dense_total": 8388608,
297
+ "linear_nnz": 3191808,
298
+ "linear_total": 12582912,
299
+ "nnz": 3200094,
300
+ "total": 12594304
301
+ },
302
+ "4": {
303
+ "linear_attention_nnz": 835584,
304
+ "linear_attention_total": 4194304,
305
+ "linear_dense_nnz": 2035712,
306
+ "linear_dense_total": 8388608,
307
+ "linear_nnz": 2871296,
308
+ "linear_total": 12582912,
309
+ "nnz": 2879362,
310
+ "total": 12594112
311
+ },
312
+ "5": {
313
+ "linear_attention_nnz": 734208,
314
+ "linear_attention_total": 4194304,
315
+ "linear_dense_nnz": 2123776,
316
+ "linear_dense_total": 8388608,
317
+ "linear_nnz": 2857984,
318
+ "linear_total": 12582912,
319
+ "nnz": 2866029,
320
+ "total": 12594112
321
+ },
322
+ "6": {
323
+ "linear_attention_nnz": 816128,
324
+ "linear_attention_total": 4194304,
325
+ "linear_dense_nnz": 2312192,
326
+ "linear_dense_total": 8388608,
327
+ "linear_nnz": 3128320,
328
+ "linear_total": 12582912,
329
+ "nnz": 3136361,
330
+ "total": 12593920
331
+ },
332
+ "7": {
333
+ "linear_attention_nnz": 1503232,
334
+ "linear_attention_total": 4194304,
335
+ "linear_dense_nnz": 2338816,
336
+ "linear_dense_total": 8388608,
337
+ "linear_nnz": 3842048,
338
+ "linear_total": 12582912,
339
+ "nnz": 3850774,
340
+ "total": 12594688
341
+ },
342
+ "8": {
343
+ "linear_attention_nnz": 1784832,
344
+ "linear_attention_total": 4194304,
345
+ "linear_dense_nnz": 2328576,
346
+ "linear_dense_total": 8388608,
347
+ "linear_nnz": 4113408,
348
+ "linear_total": 12582912,
349
+ "nnz": 4122385,
350
+ "total": 12594880
351
+ },
352
+ "9": {
353
+ "linear_attention_nnz": 1396736,
354
+ "linear_attention_total": 4194304,
355
+ "linear_dense_nnz": 2463744,
356
+ "linear_dense_total": 8388608,
357
+ "linear_nnz": 3860480,
358
+ "linear_total": 12582912,
359
+ "nnz": 3869363,
360
+ "total": 12594688
361
+ }
362
+ },
363
+ "linear_nnz": 77822976,
364
+ "linear_sparsity": 74.22993977864583,
365
+ "linear_total": 301989888,
366
+ "nnz": 109815770,
367
+ "pruned_heads": {
368
+ "0": [0, 3, 4, 5, 9, 13, 15],
369
+ "1": [0, 1, 7, 9, 10, 13, 14],
370
+ "10": [1, 2, 4, 5, 6, 8, 11, 13],
371
+ "11": [2, 5, 6, 8, 12, 15],
372
+ "12": [0, 2, 6, 9, 13],
373
+ "13": [2, 3, 6, 10, 12, 15],
374
+ "14": [10, 5],
375
+ "15": [0, 9],
376
+ "16": [],
377
+ "17": [1, 4, 12],
378
+ "18": [11, 4],
379
+ "19": [5],
380
+ "2": [0, 1, 4, 6, 7, 8, 9, 11, 12, 13, 14, 15],
381
+ "20": [0, 1, 12],
382
+ "21": [0, 2, 3, 4, 8, 10, 11, 12, 15],
383
+ "22": [0, 1, 3, 7, 9, 10, 11, 13],
384
+ "23": [2, 4, 7, 8, 9, 10, 13],
385
+ "3": [0, 3, 5, 6, 7, 8, 9, 13, 14, 15],
386
+ "4": [0, 2, 3, 5, 6, 7, 9, 10, 11, 12, 14],
387
+ "5": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15],
388
+ "6": [0, 1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 15],
389
+ "7": [3, 5, 8, 9, 10, 11, 12, 13],
390
+ "8": [3, 5, 7, 8, 9, 11, 12],
391
+ "9": [0, 1, 2, 5, 6, 7, 13, 14]
392
+ },
393
+ "total": 334064578,
394
+ "total_sparsity": 67.12738277806874
395
+ },
396
+ "training_args": {
397
+ "_n_gpu": 1,
398
+ "adafactor": false,
399
+ "adam_beta1": 0.9,
400
+ "adam_beta2": 0.999,
401
+ "adam_epsilon": 1e-08,
402
+ "dataloader_drop_last": false,
403
+ "dataloader_num_workers": 0,
404
+ "dataloader_pin_memory": true,
405
+ "ddp_find_unused_parameters": null,
406
+ "debug": false,
407
+ "deepspeed": null,
408
+ "disable_tqdm": false,
409
+ "do_eval": 1,
410
+ "do_predict": false,
411
+ "do_train": 1,
412
+ "eval_accumulation_steps": null,
413
+ "eval_steps": 5000,
414
+ "evaluation_strategy": "steps",
415
+ "fp16": false,
416
+ "fp16_backend": "auto",
417
+ "fp16_full_eval": false,
418
+ "fp16_opt_level": "O1",
419
+ "gradient_accumulation_steps": 1,
420
+ "greater_is_better": null,
421
+ "group_by_length": false,
422
+ "ignore_data_skip": false,
423
+ "label_names": null,
424
+ "label_smoothing_factor": 0.0,
425
+ "learning_rate": 3e-05,
426
+ "length_column_name": "length",
427
+ "load_best_model_at_end": false,
428
+ "local_rank": -1,
429
+ "logging_dir": "/data_2to/devel_data/nn_pruning/output/squadv2_test_3/",
430
+ "logging_first_step": false,
431
+ "logging_steps": 250,
432
+ "logging_strategy": "steps",
433
+ "lr_scheduler_type": "linear",
434
+ "max_grad_norm": 1.0,
435
+ "max_steps": -1,
436
+ "metric_for_best_model": null,
437
+ "mp_parameters": "",
438
+ "no_cuda": false,
439
+ "num_train_epochs": 20.06,
440
+ "optimize_model_before_eval": "disabled",
441
+ "output_dir": "/data_2to/devel_data/nn_pruning/output/squadv2_test_3/",
442
+ "overwrite_output_dir": 1,
443
+ "past_index": -1,
444
+ "per_device_eval_batch_size": 128,
445
+ "per_device_train_batch_size": 8,
446
+ "per_gpu_eval_batch_size": null,
447
+ "per_gpu_train_batch_size": null,
448
+ "prediction_loss_only": false,
449
+ "remove_unused_columns": true,
450
+ "report_to": ["tensorboard", "wandb"],
451
+ "run_name": "/data_2to/devel_data/nn_pruning/output/squadv2_test_3/",
452
+ "save_steps": 5000,
453
+ "save_strategy": "steps",
454
+ "save_total_limit": 50,
455
+ "seed": 17,
456
+ "sharded_ddp": [],
457
+ "skip_memory_metrics": false,
458
+ "tpu_metrics_debug": false,
459
+ "tpu_num_cores": null,
460
+ "warmup_ratio": 0.0,
461
+ "warmup_steps": 5400,
462
+ "weight_decay": 0.0
463
+ }
464
+ }