madlag commited on
Commit
74a9437
1 Parent(s): ab63cfa

Adding model, graphs and metadata.

Browse files
README.md CHANGED
@@ -28,7 +28,7 @@ The model contains **24.0%** of the original weights **overall** (the embeddings
28
  With a simple resizing of the linear matrices it ran **2.63x as fast as bert-large-uncased-whole-word-masking** on the evaluation.
29
  This is possible because the pruning method led to structured matrices: to visualize them, hover over the plot below to see the non-zero/zero parts of each matrix.
30
 
31
- <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/density_info.js" id="cddd6c5c-2e1d-40c7-b172-f7d5422349a6"></script></div>
32
 
33
  In terms of accuracy, its **F1 is 82.57**, compared with 85.85 for bert-large-uncased-whole-word-masking, an **F1 drop of 3.28**.
34
 
@@ -38,7 +38,7 @@ This model is case-insensitive: it does not make a difference between english an
38
 
39
  A side-effect of the block pruning is that some of the attention heads are completely removed: 190 heads were removed out of a total of 384 (49.5%).
40
  Here is a detailed view on how the remaining heads are distributed in the network after pruning.
41
- <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/pruning_info.js" id="03ad75cf-8048-44ae-a1d6-db69021cc168"></script></div>
42
 
43
  ## Details of the SQuAD1.1 dataset
44
 
28
  With a simple resizing of the linear matrices it ran **2.63x as fast as bert-large-uncased-whole-word-masking** on the evaluation.
29
  This is possible because the pruning method led to structured matrices: to visualize them, hover over the plot below to see the non-zero/zero parts of each matrix.
30
 
31
+ <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/density_info.js" id="64b46a6e-dbe2-4f43-83f9-470cbe9b6ced"></script></div>
32
 
33
  In terms of accuracy, its **F1 is 82.57**, compared with 85.85 for bert-large-uncased-whole-word-masking, an **F1 drop of 3.28**.
34
 
38
 
39
  A side-effect of the block pruning is that some of the attention heads are completely removed: 190 heads were removed out of a total of 384 (49.5%).
40
  Here is a detailed view on how the remaining heads are distributed in the network after pruning.
41
+ <div class="graph"><script src="/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/pruning_info.js" id="c81effce-5f17-4643-b14a-e5e982bed699"></script></div>
42
 
43
  ## Details of the SQuAD1.1 dataset
44
 
eval/eval_metrics.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "HasAns_exact": 74.79757085020243,
3
+ "HasAns_f1": 80.55343166851642,
4
+ "HasAns_total": 5928,
5
+ "NoAns_exact": 84.57527333894029,
6
+ "NoAns_f1": 84.57527333894029,
7
+ "NoAns_total": 5945,
8
+ "best_exact": 79.69342205002948,
9
+ "best_exact_thresh": 0.0,
10
+ "best_f1": 82.56723178059156,
11
+ "best_f1_thresh": 0.0,
12
+ "exact": 79.69342205002948,
13
+ "f1": 82.5672317805917,
14
+ "total": 11873
15
+ }
eval/evaluate_timing.json ADDED
@@ -0,0 +1 @@
 
1
+ {"eval_elapsed_time": 146.44436294282787, "cuda_eval_elapsed_time": 141.51923974609375}
eval/nbest_predictions.json.tgz ADDED
Binary file (7.44 MB). View file
eval/null_odds.json ADDED
The diff for this file is too large to render. See raw diff
eval/predictions.json ADDED
The diff for this file is too large to render. See raw diff
eval/sparsity_report.json ADDED
@@ -0,0 +1 @@
 
1
+ {"total": 334057858, "nnz": 83313090, "linear_total": 301989888, "linear_nnz": 51337216, "layers": {"0": {"total": 12594496, "nnz": 1593727, "linear_total": 12582912, "linear_nnz": 1586176, "linear_attention_total": 4194304, "linear_attention_nnz": 998400, "linear_dense_total": 8388608, "linear_dense_nnz": 587776}, "1": {"total": 12594496, "nnz": 1657297, "linear_total": 12582912, "linear_nnz": 1649664, "linear_attention_total": 4194304, "linear_attention_nnz": 1025024, "linear_dense_total": 8388608, "linear_dense_nnz": 624640}, "2": {"total": 12593728, "nnz": 1479660, "linear_total": 12582912, "linear_nnz": 1472512, "linear_attention_total": 4194304, "linear_attention_nnz": 595968, "linear_dense_total": 8388608, "linear_dense_nnz": 876544}, "3": {"total": 12594112, "nnz": 2009554, "linear_total": 12582912, "linear_nnz": 2001920, "linear_attention_total": 4194304, "linear_attention_nnz": 916480, "linear_dense_total": 8388608, "linear_dense_nnz": 1085440}, "4": {"total": 12593920, "nnz": 1833264, "linear_total": 12582912, "linear_nnz": 1825792, "linear_attention_total": 4194304, "linear_attention_nnz": 678912, "linear_dense_total": 8388608, "linear_dense_nnz": 1146880}, "5": {"total": 12593920, "nnz": 1825983, "linear_total": 12582912, "linear_nnz": 1818624, "linear_attention_total": 4194304, "linear_attention_nnz": 509952, "linear_dense_total": 8388608, "linear_dense_nnz": 1308672}, "6": {"total": 12593920, "nnz": 2167168, "linear_total": 12582912, "linear_nnz": 2159616, "linear_attention_total": 4194304, "linear_attention_nnz": 717824, "linear_dense_total": 8388608, "linear_dense_nnz": 1441792}, "7": {"total": 12594112, "nnz": 2485901, "linear_total": 12582912, "linear_nnz": 2478080, "linear_attention_total": 4194304, "linear_attention_nnz": 1009664, "linear_dense_total": 8388608, "linear_dense_nnz": 1468416}, "8": {"total": 12594496, "nnz": 2803661, "linear_total": 12582912, "linear_nnz": 2795520, "linear_attention_total": 4194304, "linear_attention_nnz": 
1327104, "linear_dense_total": 8388608, "linear_dense_nnz": 1468416}, "9": {"total": 12593920, "nnz": 2171276, "linear_total": 12582912, "linear_nnz": 2163712, "linear_attention_total": 4194304, "linear_attention_nnz": 631808, "linear_dense_total": 8388608, "linear_dense_nnz": 1531904}, "10": {"total": 12594688, "nnz": 2807915, "linear_total": 12582912, "linear_nnz": 2799616, "linear_attention_total": 4194304, "linear_attention_nnz": 1531904, "linear_dense_total": 8388608, "linear_dense_nnz": 1267712}, "11": {"total": 12594496, "nnz": 2868180, "linear_total": 12582912, "linear_nnz": 2860032, "linear_attention_total": 4194304, "linear_attention_nnz": 1508352, "linear_dense_total": 8388608, "linear_dense_nnz": 1351680}, "12": {"total": 12594880, "nnz": 2771132, "linear_total": 12582912, "linear_nnz": 2762752, "linear_attention_total": 4194304, "linear_attention_nnz": 1525760, "linear_dense_total": 8388608, "linear_dense_nnz": 1236992}, "13": {"total": 12595264, "nnz": 3245559, "linear_total": 12582912, "linear_nnz": 3236864, "linear_attention_total": 4194304, "linear_attention_nnz": 1813504, "linear_dense_total": 8388608, "linear_dense_nnz": 1423360}, "14": {"total": 12595072, "nnz": 2936051, "linear_total": 12582912, "linear_nnz": 2927616, "linear_attention_total": 4194304, "linear_attention_nnz": 1774592, "linear_dense_total": 8388608, "linear_dense_nnz": 1153024}, "15": {"total": 12595840, "nnz": 2996110, "linear_total": 12582912, "linear_nnz": 2987008, "linear_attention_total": 4194304, "linear_attention_nnz": 1909760, "linear_dense_total": 8388608, "linear_dense_nnz": 1077248}, "16": {"total": 12595840, "nnz": 3270645, "linear_total": 12582912, "linear_nnz": 3261440, "linear_attention_total": 4194304, "linear_attention_nnz": 2169856, "linear_dense_total": 8388608, "linear_dense_nnz": 1091584}, "17": {"total": 12595264, "nnz": 2903531, "linear_total": 12582912, "linear_nnz": 2894848, "linear_attention_total": 4194304, "linear_attention_nnz": 1823744, 
"linear_dense_total": 8388608, "linear_dense_nnz": 1071104}, "18": {"total": 12595648, "nnz": 2669146, "linear_total": 12582912, "linear_nnz": 2660352, "linear_attention_total": 4194304, "linear_attention_nnz": 1886208, "linear_dense_total": 8388608, "linear_dense_nnz": 774144}, "19": {"total": 12595648, "nnz": 1927354, "linear_total": 12582912, "linear_nnz": 1918976, "linear_attention_total": 4194304, "linear_attention_nnz": 1472512, "linear_dense_total": 8388608, "linear_dense_nnz": 446464}, "20": {"total": 12595456, "nnz": 1386290, "linear_total": 12582912, "linear_nnz": 1378304, "linear_attention_total": 4194304, "linear_attention_nnz": 1079296, "linear_dense_total": 8388608, "linear_dense_nnz": 299008}, "21": {"total": 12594688, "nnz": 674764, "linear_total": 12582912, "linear_nnz": 667648, "linear_attention_total": 4194304, "linear_attention_nnz": 512000, "linear_dense_total": 8388608, "linear_dense_nnz": 155648}, "22": {"total": 12594304, "nnz": 472716, "linear_total": 12582912, "linear_nnz": 465920, "linear_attention_total": 4194304, "linear_attention_nnz": 375808, "linear_dense_total": 8388608, "linear_dense_nnz": 90112}, "23": {"total": 12594688, "nnz": 571244, "linear_total": 12582912, "linear_nnz": 564224, "linear_attention_total": 4194304, "linear_attention_nnz": 343040, "linear_dense_total": 8388608, "linear_dense_nnz": 221184}}, "total_sparsity": 75.06028132408129, "linear_sparsity": 83.00035264756944, "pruned_heads": {"0": [0, 1, 3, 4, 5, 8, 9, 13, 15], "1": [0, 1, 3, 5, 7, 9, 10, 13, 14], "2": [0, 1, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "3": [0, 3, 5, 6, 7, 8, 9, 11, 13, 14, 15], "4": [0, 2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 14], "5": [1, 3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15], "6": [0, 1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 15], "7": [0, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14], "8": [3, 4, 5, 7, 8, 9, 10, 11, 12], "9": [0, 1, 2, 3, 5, 6, 7, 9, 10, 13, 14, 15], "10": [1, 2, 4, 5, 6, 8, 11, 13], "11": [0, 2, 5, 6, 7, 8, 10, 12, 15], "12": [0, 2, 6, 8, 9, 11, 13], 
"13": [2, 6, 10, 12, 15], "14": [1, 5, 6, 10, 11, 15], "15": [0, 9], "16": [5, 7], "17": [1, 4, 8, 12, 14], "18": [3, 11, 4], "19": [0, 12, 5], "20": [0, 10, 4, 12], "21": [0, 2, 3, 4, 8, 11, 12, 15], "22": [0, 1, 3, 4, 7, 9, 10, 11, 13, 15], "23": [2, 4, 8, 9, 10, 13, 14, 15]}}
eval/speed_report.json ADDED
@@ -0,0 +1 @@
 
1
+ {"timings": {"eval_elapsed_time": 56.62768604200005, "cuda_eval_elapsed_time": 52.126098907470706}, "metrics": {"HasAns_exact": 74.8144399460189, "HasAns_f1": 80.555306012496, "HasAns_total": 5928, "NoAns_exact": 84.57527333894029, "NoAns_f1": 84.57527333894029, "NoAns_total": 5945, "best_exact": 79.70184452118251, "best_exact_thresh": 0.0, "best_f1": 82.56816761071966, "best_f1_thresh": 0.0, "exact": 79.70184452118251, "f1": 82.56816761071981, "total": 11873}}
model_card/density_info.js CHANGED
@@ -16,9 +16,9 @@
16
 
17
 
18
 
19
- var element = document.getElementById("cddd6c5c-2e1d-40c7-b172-f7d5422349a6");
20
  if (element == null) {
21
- console.warn("Bokeh: autoload.js configured with elementid 'cddd6c5c-2e1d-40c7-b172-f7d5422349a6' but no matching script tag was found.")
22
  }
23
 
24
 
@@ -115,8 +115,8 @@
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
- var docs_json = '{"6f8350c7-6159-4d2b-8e5f-df1c89f733ab":{"roots":{"references":[{"attributes":{},"id":"1152","type":"UnionRenderers"},{"attributes":{"source":{"id":"1128"}},"id":"1133","type":"CDSView"},{"attributes":{},"id":"1153","type":"Selection"},{"attributes":{"data":{"density":["27.2%","7.0%","7.0%","24.2%","7.4%","7.4%","12.7%","10.4%","10.4%","22.9%","12.9%","12.9%","17.0%","13.7%","13.7%","13.4%","15.6%","15.6%","18.9%","17.2%","17.2%","24.6%","17.5%","17.5%","31.2%","17.5%","17.5%","14.8%","18.3%","18.3%","36.1%","15.1%","15.1%","33.6%","16.1%","16.1%","34.7%","14.7%","14.7%","44.4%","17.0%","17.0%","41.4%","13.7%","13.7%","41.5%","12.8%","12.8%","50.1%","13.0%","13.0%","43.1%","12.8%","12.8%","38.4%","9.2%","9.2%","28.5%","5.3%","5.3%","18.5%","3.6%","3.6%","9.5%","1.9%","1.9%","6.1%","1.1%","1.1%","7.3%","2.6%","2.6%"],"height":[0.285696,0.293888,0.293888,0.253952,0.31232,0.31232,0.13312,0.438272,0.438272,0.24064,0.54272,0.54272,0.178176,0.57344,0.57344,0.140288,0.654336,0.654336,0.198656,0.720896,0.720896,0.258048,0.734208,0.734208,0.326656,0.734208,0.734208,0.155648,0.765952,0.765952,0.37888,0.633856,0.633856,0.352256,0.67584,0.67584,0.36352,0.618496,0.618496,0.46592,0.71168,0.71168,0.434176,0.576512,0.576512,0.4352,0.538624,0.538624,0.525312,0.545792,0.545792,0.451584,0.535552,0.535552,0.402432,0.387072,0.387072,0.299008,0.223232,0.223232,0.193536,0.149504,0.149504,0.099328,0.077824,0.077824,0.063488,0.045056,0.045056,0.0768,0.110592,0.110592],"img_height":["128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","12
8px","128px","512px","128px","128px","512px","128px","128px","512px","128px"],"img_width":["128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px"],"name":["0.attention.output","0.intermediate","0.output","1.attention.output","1.intermediate","1.output","2.attention.output","2.intermediate","2.output","3.attention.output","3.intermediate","3.output","4.attention.output","4.intermediate","4.output","5.attention.output","5.intermediate","5.output","6.attention.output","6.intermediate","6.output","7.attention.output","7.intermediate","7.output","8.attention.output","8.intermediate","8.output","9.attention.output","9.intermediate","9.output","10.attention.output","10.intermediate","10.output","11.attention.output","11.intermediate","11.output","12.attention.output","12.intermediate","12.output","13.attention.output","13.intermediate","13.output","14.attention.output","14.intermediate","14.output","15.attention.output","15.intermediate","15.output","16.attention.output","16.intermediate","16.output","17.attention.output","17.intermediate","17.output","18.attention.output","18.intermediate","18.output","19.attention.output","19.intermediate","19.output","20.attention.output","20.intermediate","20.output","21.attention.output","21.intermediate","21.output","22.attention.output","22.intermediate","22.output","23.attention.output","23.intermediate","23.output"],"parameters":["0.29","0.29","0.29","0.25","0.31","0.31","0.13","0.44","0.44","0.24","0.54","0.54","0.18",
"0.57","0.57","0.14","0.65","0.65","0.20","0.72","0.72","0.26","0.73","0.73","0.33","0.73","0.73","0.16","0.77","0.77","0.38","0.63","0.63","0.35","0.68","0.68","0.36","0.62","0.62","0.47","0.71","0.71","0.43","0.58","0.58","0.44","0.54","0.54","0.53","0.55","0.55","0.45","0.54","0.54","0.40","0.39","0.39","0.30","0.22","0.22","0.19","0.15","0.15","0.10","0.08","0.08","0.06","0.05","0.05","0.08","0.11","0.11"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/i
mages/layer_4_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/
layer_9_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/ima
ges/layer_14_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/ima
ges/layer_20_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_output_dense.png"],"x":[0.5833333333333334,0.75,0.9166666666666667,1.5833333333333333,1.75,1.9166666666666665,2.5833333333333335,2.75,2.916666666666667,3.5833333333333335,3.75,3.916666666666667,4.583333333333333,4.75,4.916666666666666,5.583333333333333,5.75,5.916666666666666,6.583333333333333,6.75,6.916666666666666,7.583333333333333,7.75,7.916666666666666,8.583333333333334,8.75,8.916666666666668,9.583333333333334,9.75,9.916666666666668,10.583333333333334,10.75,10.916666666666668,11.583333333333334,11.75,11.916666666666668,12.583333333333334,12.75,12.916666666666668,13.583333333333334,13.75,13.916
666666666668,14.583333333333334,14.75,14.916666666666668,15.583333333333334,15.75,15.916666666666668,16.583333333333332,16.75,16.916666666666664,17.583333333333332,17.75,17.916666666666664,18.583333333333332,18.75,18.916666666666664,19.583333333333332,19.75,19.916666666666664,20.583333333333332,20.75,20.916666666666664,21.583333333333332,21.75,21.916666666666664,22.583333333333332,22.75,22.916666666666664,23.583333333333332,23.75,23.916666666666664]},"selected":{"id":"1157"},"selection_policy":{"id":"1156"}},"id":"1134","type":"ColumnDataSource"},{"attributes":{"fill_color":{"value":"#aa69f7"},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1136","type":"VBar"},{"attributes":{"items":[{"id":"1141"},{"id":"1142"},{"id":"1143"},{"id":"1144"}],"location":[10,0],"orientation":"horizontal"},"id":"1140","type":"Legend"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#aa69f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1137","type":"VBar"},{"attributes":{"source":{"id":"1134"}},"id":"1139","type":"CDSView"},{"attributes":{},"id":"1146","type":"BasicTickFormatter"},{"attributes":{},"id":"1154","type":"UnionRenderers"},{"attributes":{"label":{"value":"query"},"renderers":[{"id":"1120"}]},"id":"1141","type":"LegendItem"},{"attributes":{},"id":"1155","type":"Selection"},{"attributes":{"label":{"value":"key"},"renderers":[{"id":"1126"}]},"id":"1142","type":"LegendItem"},{"attributes":{},"id":"1148","type":"BasicTickFormatter"},{"attributes":{"data_source":{"id":"1116"},"glyph":{"id":"1118"},"hover_glyph":null,"muted_glyph":null,"name":"query","nonselection_glyph":{"id":"1119"},"selection_glyph":null,"view":{"id":"1121"}},"id":"1120","type":"GlyphRenderer"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#6573f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#6573f7"},"top":{"field":"height"}
,"width":{"value":0.125},"x":{"field":"x"}},"id":"1119","type":"VBar"},{"attributes":{"fill_color":{"value":"#ed5642"},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1124","type":"VBar"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto","tools":[{"id":"1094"}]},"id":"1114","type":"Toolbar"},{"attributes":{"data":{"density":["21.9%","25.6%","14.8%","20.7%","15.9%","10.5%","15.9%","23.8%","33.8%","15.7%","36.9%","39.3%","37.3%","41.9%","45.7%","49.4%","51.6%","42.2%","48.9%","39.3%","32.0%","15.0%","10.2%","7.9%"],"height":[0.229376,0.268288,0.155648,0.217088,0.166912,0.110592,0.166912,0.249856,0.354304,0.164864,0.387072,0.411648,0.391168,0.439296,0.479232,0.518144,0.540672,0.442368,0.513024,0.411648,0.335872,0.157696,0.106496,0.082944],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.query","1.attention.query","2.attention.query","3.attention.query","4.attention.query","5.attention.query","6.attention.query","7.attention.query","8.attention.query","9.attention.query","10.attention.query","11.attention.query","12.attention.query","13.attention.query","14.attention.query","15.attention.query","16.attention.query","17.attention.query","18.attention.query","19.attention.query","20.attention.query","21.attention.query","22.attention.query","23.attention.query"],"parameters":["0.23","0.27","0.16","0.22","0.17","0.11","0.17","0.25","0.35","0.16","0.39","0.41","0.39","0.44","0.48","0.52","0.54","0.44","0.51","0.41","0.34","0.16","0.11","0.08"],"url":["/madlag/bert-la
rge-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_atte
ntion_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_query.png"],"x":[0.08333333333333333,1.0833333333333333,2.0833333333333335,3.0833333333333335,4.083333333333333,5.083333333333333,6.083333333333333,7.083333333333333,8.083333333333334,9.083333333333334,10.083333333333334,11.083333333333334,12.083333333333334,13.083333333333334,14.083333333333334,15.083333333333334,16.083333333333332,17.083333333333332,18.083333333333332,19.083333333333332,20.083333333333332,21.083333333333332,22.083333333333332,23.083333333333332]},"selected":{"id":"1151"},"selection_policy":{"id":"1150"}},"id":"1116","type":"ColumnDataSource"},{"attributes":{"label":{"value":"value"},"renderers":[{"id":"1132"}]},"id":"1143","type":"LegendItem"},{"attributes":{},"id":"1111","type":"BasicTicker"},{"attributes":{"source":{"id":"1116"}},"id":"1121","type":"CDSView"},{"attributes":{"axis_label":"Parameters 
(M)","formatter":{"id":"1146"},"minor_tick_line_color":null,"ticker":{"id":"1111"}},"id":"1110","type":"LinearAxis"},{"attributes":{"label":{"value":"fully connected"},"renderers":[{"id":"1138"}]},"id":"1144","type":"LegendItem"},{"attributes":{"above":[{"id":"1140"}],"below":[{"id":"1106"}],"center":[{"id":"1109"},{"id":"1113"}],"left":[{"id":"1110"}],"outline_line_color":null,"plot_height":300,"plot_width":505,"renderers":[{"id":"1120"},{"id":"1126"},{"id":"1132"},{"id":"1138"}],"title":{"id":"1096"},"toolbar":{"id":"1114"},"x_range":{"id":"1098"},"x_scale":{"id":"1102"},"y_range":{"id":"1100"},"y_scale":{"id":"1104"}},"id":"1095","subtype":"Figure","type":"Plot"},{"attributes":{"data":{"density":["20.7%","25.8%","16.2%","22.0%","16.6%","11.7%","17.1%","25.6%","34.1%","16.8%","39.8%","39.5%","37.6%","44.2%","44.6%","52.3%","55.2%","44.3%","52.2%","41.5%","33.5%","14.2%","12.1%","9.4%"],"height":[0.217088,0.270336,0.169984,0.2304,0.17408,0.12288,0.1792,0.268288,0.357376,0.176128,0.417792,0.413696,0.39424,0.463872,0.467968,0.548864,0.57856,0.464896,0.54784,0.4352,0.351232,0.14848,0.126976,0.098304],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.key","1.attention.key","2.attention.key","3.attention.key","4.attention.key","5.attention.key","6.attention.key","7.attention.key","8.attention.key","9.attention.key","10.attention.key","11.attention.key","12.attention.key","13.attention.key","14.attention.key","15.attention.key","16.attention.key","17.attention.key","18.attention.key","19.attention.key","20.attention.key","21.attention.key","22.attention.key","23.attention.key"],"parameters":["0
.22","0.27","0.17","0.23","0.17","0.12","0.18","0.27","0.36","0.18","0.42","0.41","0.39","0.46","0.47","0.55","0.58","0.46","0.55","0.44","0.35","0.15","0.13","0.10"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/ma
in/model_card/images/layer_14_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_key.png"],"x":[0.25,1.25,2.25,3.25,4.25,5.25,6.25,7.25,8.25,9.25,10.25,11.25,12.25,13.25,14.25,15.25,16.25,17.25,18.25,19.25,20.25,21.25,22.25,23.25]},"selected":{"id":"1153"},"selection_policy":{"id":"1152"}},"id":"1122","type":"ColumnDataSource"},{"attributes":{},"id":"1156","type":"UnionRenderers"},{"attributes":{"axis":{"id":"1110"},"dimension":1,"ticker":null},"id":"1113","type":"Grid"},{"attributes":{},"id":"1157","type":"Selection"},{"attributes":{},"id":"1102","type":"LinearScale"},{"attributes":{},"id":"1150","type":"UnionRenderers"},{"attributes":{"callback":null,"tooltips":"\\n &lt;div&gt;\\n &lt;div style=\\"margin-bottom:10px\\"&gt;\\n &lt;span style=\\"font-size: 15px;\\"&gt;&lt;b&gt;@name&lt;/b&gt;&lt;br/&gt;density=@density&lt;/span&gt;\\n &lt;/div&gt;\\n &lt;div&gt; \\n &lt;img\\n 
src=\\"@url\\" height=\\"@img_height\\" width=\\"@img_width\\" alt=\\"@url\\"\\n style=\\"float: left; margin: 0px 15px 15px 0px;\\"\\n border=\\"0\\"\\n /&gt;\\n &lt;/div&gt;\\n &lt;/div&gt;\\n "},"id":"1094","type":"HoverTool"},{"attributes":{"data_source":{"id":"1122"},"glyph":{"id":"1124"},"hover_glyph":null,"muted_glyph":null,"name":"key","nonselection_glyph":{"id":"1125"},"selection_glyph":null,"view":{"id":"1127"}},"id":"1126","type":"GlyphRenderer"},{"attributes":{"axis":{"id":"1106"},"grid_line_color":null,"ticker":null},"id":"1109","type":"Grid"},{"attributes":{"data_source":{"id":"1134"},"glyph":{"id":"1136"},"hover_glyph":null,"muted_glyph":null,"name":"fully connected","nonselection_glyph":{"id":"1137"},"selection_glyph":null,"view":{"id":"1139"}},"id":"1138","type":"GlyphRenderer"},{"attributes":{},"id":"1151","type":"Selection"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#ed5642"},"line_alpha":{"value":0.1},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1125","type":"VBar"},{"attributes":{"data":{"density":["25.4%","22.2%","13.1%","21.8%","15.2%","13.0%","16.5%","22.3%","27.5%","12.9%","33.2%","31.5%","35.9%","42.4%","37.5%","38.9%","50.1%","44.3%","40.3%","31.2%","18.9%","10.2%","7.5%","8.1%"],"height":[0.26624,0.232448,0.137216,0.228352,0.159744,0.136192,0.173056,0.233472,0.288768,0.135168,0.34816,0.330752,0.376832,0.444416,0.393216,0.407552,0.525312,0.464896,0.422912,0.326656,0.198656,0.106496,0.078848,0.084992],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.value","1.attention.value","2.
attention.value","3.attention.value","4.attention.value","5.attention.value","6.attention.value","7.attention.value","8.attention.value","9.attention.value","10.attention.value","11.attention.value","12.attention.value","13.attention.value","14.attention.value","15.attention.value","16.attention.value","17.attention.value","18.attention.value","19.attention.value","20.attention.value","21.attention.value","22.attention.value","23.attention.value"],"parameters":["0.27","0.23","0.14","0.23","0.16","0.14","0.17","0.23","0.29","0.14","0.35","0.33","0.38","0.44","0.39","0.41","0.53","0.46","0.42","0.33","0.20","0.11","0.08","0.08"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/im
ages/layer_10_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_value.png"],"x":[0.41666666666666663,1.4166666666666665,2.416666666666667,3.416666666666667,4.416666666666666,5.416666666666666,6.416666666666666,7.416666666666666,8.416666666666668,9.416666666666668,10.416666666666668,11.416666666666668,12.416666666666668,13.416666666666668,14.416666666666668,15.416666666
666668,16.416666666666664,17.416666666666664,18.416666666666664,19.416666666666664,20.416666666666664,21.416666666666664,22.416666666666664,23.416666666666664]},"selected":{"id":"1155"},"selection_policy":{"id":"1154"}},"id":"1128","type":"ColumnDataSource"},{"attributes":{"text":"Transformer Layers"},"id":"1096","type":"Title"},{"attributes":{},"id":"1104","type":"LinearScale"},{"attributes":{"source":{"id":"1122"}},"id":"1127","type":"CDSView"},{"attributes":{"fill_color":{"value":"#6573f7"},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1118","type":"VBar"},{"attributes":{"fill_color":{"value":"#20cb97"},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1130","type":"VBar"},{"attributes":{"start":0},"id":"1100","type":"DataRange1d"},{"attributes":{},"id":"1098","type":"DataRange1d"},{"attributes":{"axis_label":"Layer","formatter":{"id":"1148"},"minor_tick_line_color":null,"ticker":{"id":"1107"}},"id":"1106","type":"LinearAxis"},{"attributes":{"data_source":{"id":"1128"},"glyph":{"id":"1130"},"hover_glyph":null,"muted_glyph":null,"name":"value","nonselection_glyph":{"id":"1131"},"selection_glyph":null,"view":{"id":"1133"}},"id":"1132","type":"GlyphRenderer"},{"attributes":{},"id":"1107","type":"BasicTicker"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#20cb97"},"line_alpha":{"value":0.1},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1131","type":"VBar"}],"root_ids":["1095"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
- var render_items = [{"docid":"6f8350c7-6159-4d2b-8e5f-df1c89f733ab","root_ids":["1095"],"roots":{"1095":"cddd6c5c-2e1d-40c7-b172-f7d5422349a6"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
16
 
17
 
18
 
19
+ var element = document.getElementById("64b46a6e-dbe2-4f43-83f9-470cbe9b6ced");
20
  if (element == null) {
21
+ console.warn("Bokeh: autoload.js configured with elementid '64b46a6e-dbe2-4f43-83f9-470cbe9b6ced' but no matching script tag was found.")
22
  }
23
 
24
 
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
+ var docs_json = '{"db9c60ce-feb7-4e96-b7a0-bd8663fdcd25":{"roots":{"references":[{"attributes":{"source":{"id":"1122"}},"id":"1127","type":"CDSView"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#6573f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1119","type":"VBar"},{"attributes":{"fill_color":{"value":"#20cb97"},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1130","type":"VBar"},{"attributes":{"fill_color":{"value":"#aa69f7"},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1136","type":"VBar"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto","tools":[{"id":"1094"}]},"id":"1114","type":"Toolbar"},{"attributes":{"label":{"value":"value"},"renderers":[{"id":"1132"}]},"id":"1143","type":"LegendItem"},{"attributes":{},"id":"1155","type":"UnionRenderers"},{"attributes":{"axis_label":"Parameters (M)","formatter":{"id":"1146"},"minor_tick_line_color":null,"ticker":{"id":"1111"}},"id":"1110","type":"LinearAxis"},{"attributes":{"data_source":{"id":"1116"},"glyph":{"id":"1118"},"hover_glyph":null,"muted_glyph":null,"name":"query","nonselection_glyph":{"id":"1119"},"selection_glyph":null,"view":{"id":"1121"}},"id":"1120","type":"GlyphRenderer"},{"attributes":{},"id":"1148","type":"BasicTickFormatter"},{"attributes":{"axis":{"id":"1110"},"dimension":1,"ticker":null},"id":"1113","type":"Grid"},{"attributes":{},"id":"1151","type":"UnionRenderers"},{"attributes":{},"id":"1111","type":"BasicTicker"},{"attributes":{},"id":"1154","type":"Selection"},{"attributes":{"source":{"id":"1134"}},"id":"1139","type":"CDSView"},{"attributes":{},"id":"1153","type":"UnionRenderers"},{"attributes":{"label":{"value":"fully 
connected"},"renderers":[{"id":"1138"}]},"id":"1144","type":"LegendItem"},{"attributes":{"data_source":{"id":"1122"},"glyph":{"id":"1124"},"hover_glyph":null,"muted_glyph":null,"name":"key","nonselection_glyph":{"id":"1125"},"selection_glyph":null,"view":{"id":"1127"}},"id":"1126","type":"GlyphRenderer"},{"attributes":{"source":{"id":"1116"}},"id":"1121","type":"CDSView"},{"attributes":{"callback":null,"tooltips":"\\n &lt;div&gt;\\n &lt;div style=\\"margin-bottom:10px\\"&gt;\\n &lt;span style=\\"font-size: 15px;\\"&gt;&lt;b&gt;@name&lt;/b&gt;&lt;br/&gt;density=@density&lt;/span&gt;\\n &lt;/div&gt;\\n &lt;div&gt; \\n &lt;img\\n src=\\"@url\\" height=\\"@img_height\\" width=\\"@img_width\\" alt=\\"@url\\"\\n style=\\"float: left; margin: 0px 15px 15px 0px;\\"\\n border=\\"0\\"\\n /&gt;\\n &lt;/div&gt;\\n &lt;/div&gt;\\n "},"id":"1094","type":"HoverTool"},{"attributes":{"fill_color":{"value":"#ed5642"},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1124","type":"VBar"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#aa69f7"},"line_alpha":{"value":0.1},"line_color":{"value":"#aa69f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1137","type":"VBar"},{"attributes":{"data":{"density":["20.7%","25.8%","16.2%","22.0%","16.6%","11.7%","17.1%","25.6%","34.1%","16.8%","39.8%","39.5%","37.6%","44.2%","44.6%","52.3%","55.2%","44.3%","52.2%","41.5%","33.5%","14.2%","12.1%","9.4%"],"height":[0.217088,0.270336,0.169984,0.2304,0.17408,0.12288,0.1792,0.268288,0.357376,0.176128,0.417792,0.413696,0.39424,0.463872,0.467968,0.548864,0.57856,0.464896,0.54784,0.4352,0.351232,0.14848,0.126976,0.098304],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128
px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.key","1.attention.key","2.attention.key","3.attention.key","4.attention.key","5.attention.key","6.attention.key","7.attention.key","8.attention.key","9.attention.key","10.attention.key","11.attention.key","12.attention.key","13.attention.key","14.attention.key","15.attention.key","16.attention.key","17.attention.key","18.attention.key","19.attention.key","20.attention.key","21.attention.key","22.attention.key","23.attention.key"],"parameters":["0.22","0.27","0.17","0.23","0.17","0.12","0.18","0.27","0.36","0.18","0.42","0.41","0.39","0.46","0.47","0.55","0.58","0.46","0.55","0.44","0.35","0.15","0.13","0.10"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_atte
ntion_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_key.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_key.png"],"x":[0.25,1.25,2.25,3.25,4.25,5.25,6.25,7.25,8.25,9.25,10.25,11.25,12.25,13.25,14.25,15.25,16.25,17.25,18.25,19.25,20.25,21.25,22.25,23.25]},"selected":{"id":"1152"},"selection_policy":{"id":"1153"}},"id":"1122","ty
pe":"ColumnDataSource"},{"attributes":{},"id":"1157","type":"UnionRenderers"},{"attributes":{"label":{"value":"key"},"renderers":[{"id":"1126"}]},"id":"1142","type":"LegendItem"},{"attributes":{"data_source":{"id":"1128"},"glyph":{"id":"1130"},"hover_glyph":null,"muted_glyph":null,"name":"value","nonselection_glyph":{"id":"1131"},"selection_glyph":null,"view":{"id":"1133"}},"id":"1132","type":"GlyphRenderer"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#20cb97"},"line_alpha":{"value":0.1},"line_color":{"value":"#20cb97"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1131","type":"VBar"},{"attributes":{"axis":{"id":"1106"},"grid_line_color":null,"ticker":null},"id":"1109","type":"Grid"},{"attributes":{"source":{"id":"1128"}},"id":"1133","type":"CDSView"},{"attributes":{},"id":"1107","type":"BasicTicker"},{"attributes":{"start":0},"id":"1100","type":"DataRange1d"},{"attributes":{"data":{"density":["21.9%","25.6%","14.8%","20.7%","15.9%","10.5%","15.9%","23.8%","33.8%","15.7%","36.9%","39.3%","37.3%","41.9%","45.7%","49.4%","51.6%","42.2%","48.9%","39.3%","32.0%","15.0%","10.2%","7.9%"],"height":[0.229376,0.268288,0.155648,0.217088,0.166912,0.110592,0.166912,0.249856,0.354304,0.164864,0.387072,0.411648,0.391168,0.439296,0.479232,0.518144,0.540672,0.442368,0.513024,0.411648,0.335872,0.157696,0.106496,0.082944],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.query","1.attention.query","2.attention.query","3.attention.query","4.attention.query","5.attention.query","6.attention.query","7.attention.query","8.attention.query","9.attention.query","1
0.attention.query","11.attention.query","12.attention.query","13.attention.query","14.attention.query","15.attention.query","16.attention.query","17.attention.query","18.attention.query","19.attention.query","20.attention.query","21.attention.query","22.attention.query","23.attention.query"],"parameters":["0.23","0.27","0.16","0.22","0.17","0.11","0.17","0.25","0.35","0.16","0.39","0.41","0.39","0.44","0.48","0.52","0.54","0.44","0.51","0.41","0.34","0.16","0.11","0.08"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_qu
ery.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_query.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_query.png"],"x":[0.08333333333333333,1.0833333333333333,2.0833333333333335,3.0833333333333335,4.083333333333333,5.083333333333333,6.083333333333333,7.083333333333333,8.083333333333334,9.083333333333334,10.083333333333334,11.083333333333334,12.083333333333334,13.083333333333334,14.083333333333334,15.083333333333334,16.083333333333332,17.083333333333332,18.083333333333332,19.083333333333332,20.083333333333332,21.083333333333332,22.083333333333332,23.08333333333333
2]},"selected":{"id":"1150"},"selection_policy":{"id":"1151"}},"id":"1116","type":"ColumnDataSource"},{"attributes":{},"id":"1150","type":"Selection"},{"attributes":{"label":{"value":"query"},"renderers":[{"id":"1120"}]},"id":"1141","type":"LegendItem"},{"attributes":{},"id":"1146","type":"BasicTickFormatter"},{"attributes":{},"id":"1102","type":"LinearScale"},{"attributes":{"axis_label":"Layer","formatter":{"id":"1148"},"minor_tick_line_color":null,"ticker":{"id":"1107"}},"id":"1106","type":"LinearAxis"},{"attributes":{"fill_alpha":{"value":0.1},"fill_color":{"value":"#ed5642"},"line_alpha":{"value":0.1},"line_color":{"value":"#ed5642"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1125","type":"VBar"},{"attributes":{"data":{"density":["25.4%","22.2%","13.1%","21.8%","15.2%","13.0%","16.5%","22.3%","27.5%","12.9%","33.2%","31.5%","35.9%","42.4%","37.5%","38.9%","50.1%","44.3%","40.3%","31.2%","18.9%","10.2%","7.5%","8.1%"],"height":[0.26624,0.232448,0.137216,0.228352,0.159744,0.136192,0.173056,0.233472,0.288768,0.135168,0.34816,0.330752,0.376832,0.444416,0.393216,0.407552,0.525312,0.464896,0.422912,0.326656,0.198656,0.106496,0.078848,0.084992],"img_height":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"img_width":["128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px","128px"],"name":["0.attention.value","1.attention.value","2.attention.value","3.attention.value","4.attention.value","5.attention.value","6.attention.value","7.attention.value","8.attention.value","9.attention.value","10.attention.value","11.attention.value","12.attention.value","13.attention.value","14.attention.value","15.attention.value","16.attention.value","17.attention.value","18.attention.value"
,"19.attention.value","20.attention.value","21.attention.value","22.attention.value","23.attention.value"],"parameters":["0.27","0.23","0.14","0.23","0.16","0.14","0.17","0.23","0.29","0.14","0.35","0.33","0.38","0.44","0.39","0.41","0.53","0.46","0.42","0.33","0.20","0.11","0.08","0.08"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82
.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_self_value.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_self_value.png"],"x":[0.41666666666666663,1.4166666666666665,2.416666666666667,3.416666666666667,4.416666666666666,5.416666666666666,6.416666666666666,7.416666666666666,8.416666666666668,9.416666666666668,10.416666666666668,11.416666666666668,12.416666666666668,13.416666666666668,14.416666666666668,15.416666666666668,16.416666666666664,17.416666666666664,18.416666666666664,19.416666666666664,20.416666666666664,21.416666666666664,22.416666666666664,23.416666666666664]},"selected":{"id":"1154"},"selection_policy":{"id":"1155"}},"id":"1128","type":"ColumnDataSource"},{"attributes":{"above":[{"id":"1140"}],"below":[{"id":"1106"}],"center":[{"id":"1109"}
,{"id":"1113"}],"left":[{"id":"1110"}],"outline_line_color":null,"plot_height":300,"plot_width":505,"renderers":[{"id":"1120"},{"id":"1126"},{"id":"1132"},{"id":"1138"}],"title":{"id":"1096"},"toolbar":{"id":"1114"},"x_range":{"id":"1098"},"x_scale":{"id":"1102"},"y_range":{"id":"1100"},"y_scale":{"id":"1104"}},"id":"1095","subtype":"Figure","type":"Plot"},{"attributes":{"data":{"density":["27.2%","7.0%","7.0%","24.2%","7.4%","7.4%","12.7%","10.4%","10.4%","22.9%","12.9%","12.9%","17.0%","13.7%","13.7%","13.4%","15.6%","15.6%","18.9%","17.2%","17.2%","24.6%","17.5%","17.5%","31.2%","17.5%","17.5%","14.8%","18.3%","18.3%","36.1%","15.1%","15.1%","33.6%","16.1%","16.1%","34.7%","14.7%","14.7%","44.4%","17.0%","17.0%","41.4%","13.7%","13.7%","41.5%","12.8%","12.8%","50.1%","13.0%","13.0%","43.1%","12.8%","12.8%","38.4%","9.2%","9.2%","28.5%","5.3%","5.3%","18.5%","3.6%","3.6%","9.5%","1.9%","1.9%","6.1%","1.1%","1.1%","7.3%","2.6%","2.6%"],"height":[0.285696,0.293888,0.293888,0.253952,0.31232,0.31232,0.13312,0.438272,0.438272,0.24064,0.54272,0.54272,0.178176,0.57344,0.57344,0.140288,0.654336,0.654336,0.198656,0.720896,0.720896,0.258048,0.734208,0.734208,0.326656,0.734208,0.734208,0.155648,0.765952,0.765952,0.37888,0.633856,0.633856,0.352256,0.67584,0.67584,0.36352,0.618496,0.618496,0.46592,0.71168,0.71168,0.434176,0.576512,0.576512,0.4352,0.538624,0.538624,0.525312,0.545792,0.545792,0.451584,0.535552,0.535552,0.402432,0.387072,0.387072,0.299008,0.223232,0.223232,0.193536,0.149504,0.149504,0.099328,0.077824,0.077824,0.063488,0.045056,0.045056,0.0768,0.110592,0.110592],"img_height":["128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","51
2px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px"],"img_width":["128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px","128px","128px","512px"],"name":["0.attention.output","0.intermediate","0.output","1.attention.output","1.intermediate","1.output","2.attention.output","2.intermediate","2.output","3.attention.output","3.intermediate","3.output","4.attention.output","4.intermediate","4.output","5.attention.output","5.intermediate","5.output","6.attention.output","6.intermediate","6.output","7.attention.output","7.intermediate","7.output","8.attention.output","8.intermediate","8.output","9.attention.output","9.intermediate","9.output","10.attention.output","10.intermediate","10.output","11.attention.output","11.intermediate","11.output","12.attention.output","12.intermediate","12.output","13.attention.output","13.intermediate","13.output","14.attention.output","14.intermediate","14.output","15.attention.output","15.intermediate","15.output","16.attention.output","16.intermediate","16.output","17.attention.output","17.intermediate","17.output","18.attention.output","18.intermediate","18.output","19.attention.output","19.intermediate","19.output","20.attention.output","20.intermediate","20.output","21.attention.output","21.intermediate","21.output","22.attention.output","22.intermediate","22.output","23.attention.output","23.intermediate","23.output"],"
parameters":["0.29","0.29","0.29","0.25","0.31","0.31","0.13","0.44","0.44","0.24","0.54","0.54","0.18","0.57","0.57","0.14","0.65","0.65","0.20","0.72","0.72","0.26","0.73","0.73","0.33","0.73","0.73","0.16","0.77","0.77","0.38","0.63","0.63","0.35","0.68","0.68","0.36","0.62","0.62","0.47","0.71","0.71","0.43","0.58","0.58","0.44","0.54","0.54","0.53","0.55","0.55","0.45","0.54","0.54","0.40","0.39","0.39","0.30","0.22","0.22","0.19","0.15","0.15","0.10","0.08","0.08","0.06","0.05","0.05","0.08","0.11","0.11"],"url":["/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_0_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_1_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_2_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_3_o
utput_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_4_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_5_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_6_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_7_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_8_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_attention_output_
dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_9_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_10_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_11_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_12_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_13_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_intermedi
ate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_14_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_15_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_16_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_17_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_18_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_19_out
put_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_20_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_21_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_22_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_attention_output_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_intermediate_dense.png","/madlag/bert-large-uncased-wwm-squadv2-x2.63-f82.6-d16-hybrid-v1/raw/main/model_card/images/layer_23_output_dense.png"],"x":[0.5833333333333334,0.75,0.9166666666666667,1.5833333333333333,1.75,1.9166666666666665,2.5833333333333335,2.75,2.916666666666667,3.5833333333333335,3.75,3.916666666666667,4.583333333333333,4.75,4.916666666666666,5.583333333333333,5.75,5.916666666666666,6.583333333333333,6.75,6.916666666666666,7.583333333333333,7.75,7.916666666666666,8.583333333333334,8.75,8.916666666666668,9.583333333333334,9.75,9.916666666666668,10.583333333333334,10.75,10.916666666666668,11.583333333333
334,11.75,11.916666666666668,12.583333333333334,12.75,12.916666666666668,13.583333333333334,13.75,13.916666666666668,14.583333333333334,14.75,14.916666666666668,15.583333333333334,15.75,15.916666666666668,16.583333333333332,16.75,16.916666666666664,17.583333333333332,17.75,17.916666666666664,18.583333333333332,18.75,18.916666666666664,19.583333333333332,19.75,19.916666666666664,20.583333333333332,20.75,20.916666666666664,21.583333333333332,21.75,21.916666666666664,22.583333333333332,22.75,22.916666666666664,23.583333333333332,23.75,23.916666666666664]},"selected":{"id":"1156"},"selection_policy":{"id":"1157"}},"id":"1134","type":"ColumnDataSource"},{"attributes":{},"id":"1152","type":"Selection"},{"attributes":{},"id":"1104","type":"LinearScale"},{"attributes":{},"id":"1156","type":"Selection"},{"attributes":{"text":"Transformer Layers"},"id":"1096","type":"Title"},{"attributes":{},"id":"1098","type":"DataRange1d"},{"attributes":{"fill_color":{"value":"#6573f7"},"line_color":{"value":"#6573f7"},"top":{"field":"height"},"width":{"value":0.125},"x":{"field":"x"}},"id":"1118","type":"VBar"},{"attributes":{"items":[{"id":"1141"},{"id":"1142"},{"id":"1143"},{"id":"1144"}],"location":[10,0],"orientation":"horizontal"},"id":"1140","type":"Legend"},{"attributes":{"data_source":{"id":"1134"},"glyph":{"id":"1136"},"hover_glyph":null,"muted_glyph":null,"name":"fully connected","nonselection_glyph":{"id":"1137"},"selection_glyph":null,"view":{"id":"1139"}},"id":"1138","type":"GlyphRenderer"}],"root_ids":["1095"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
+ var render_items = [{"docid":"db9c60ce-feb7-4e96-b7a0-bd8663fdcd25","root_ids":["1095"],"roots":{"1095":"64b46a6e-dbe2-4f43-83f9-470cbe9b6ced"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
model_card/pruning_info.js CHANGED
@@ -16,9 +16,9 @@
16
 
17
 
18
 
19
- var element = document.getElementById("03ad75cf-8048-44ae-a1d6-db69021cc168");
20
  if (element == null) {
21
- console.warn("Bokeh: autoload.js configured with elementid '03ad75cf-8048-44ae-a1d6-db69021cc168' but no matching script tag was found.")
22
  }
23
 
24
 
@@ -115,8 +115,8 @@
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
- var docs_json = '{"3225a67b-1996-4161-a7db-745c9acaf2b6":{"roots":{"references":[{"attributes":{"axis":{"id":"1015"},"dimension":1,"ticker":null},"id":"1018","type":"Grid"},{"attributes":{"fields":["active"]},"id":"1022","type":"Stack"},{"attributes":{"text":"Pruned Transformer Heads"},"id":"1002","type":"Title"},{"attributes":{"data_source":{"id":"1024"},"glyph":{"id":"1026"},"hover_glyph":null,"muted_glyph":null,"name":"active","nonselection_glyph":{"id":"1027"},"selection_glyph":null,"view":{"id":"1029"}},"id":"1028","type":"GlyphRenderer"},{"attributes":{},"id":"1010","type":"LinearScale"},{"attributes":{},"id":"1013","type":"CategoricalTicker"},{"attributes":{"fields":[]},"id":"1020","type":"Stack"},{"attributes":{"factors":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"range_padding":0.1},"id":"1004","type":"FactorRange"},{"attributes":{"items":[{"id":"1056"},{"id":"1057"}],"location":[10,0],"orientation":"horizontal"},"id":"1055","type":"Legend"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1057","type":"LegendItem"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1056","type":"LegendItem"},{"attributes":{},"id":"1031","type":"BasicTickFormatter"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto"},"id":"1019","type":"Toolbar"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_color":{"value":"#ffcccc"},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1041","type":"VBar"},{"attributes":{"start":0},"id":"1006","type":"DataRange1d"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1054","type":"LegendItem"},{"attributes":{"axis_label":"Layer 
index","formatter":{"id":"1033"},"minor_tick_line_color":null,"ticker":{"id":"1013"}},"id":"1012","type":"CategoricalAxis"},{"attributes":{},"id":"1033","type":"CategoricalTickFormatter"},{"attributes":{"data":{"active":[7,7,3,5,4,4,4,5,7,4,8,7,9,11,10,14,14,11,13,13,12,8,6,8],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[9,9,13,11,12,12,12,11,9,12,8,9,7,5,6,2,2,5,3,3,4,8,10,8]},"selected":{"id":"1053"},"selection_policy":{"id":"1052"}},"id":"1039","type":"ColumnDataSource"},{"attributes":{},"id":"1008","type":"CategoricalScale"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#ffcccc"},"line_alpha":{"value":0.1},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1042","type":"VBar"},{"attributes":{"fields":["active"]},"id":"1021","type":"Stack"},{"attributes":{"source":{"id":"1024"}},"id":"1029","type":"CDSView"},{"attributes":{},"id":"1052","type":"UnionRenderers"},{"attributes":{"source":{"id":"1039"}},"id":"1044","type":"CDSView"},{"attributes":{"data_source":{"id":"1039"},"glyph":{"id":"1041"},"hover_glyph":null,"muted_glyph":null,"name":"pruned","nonselection_glyph":{"id":"1042"},"selection_glyph":null,"view":{"id":"1044"}},"id":"1043","type":"GlyphRenderer"},{"attributes":{},"id":"1016","type":"BasicTicker"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#0000ff"},"line_alpha":{"value":0.1},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1027","type":"VBar"},{"attributes":{},"id":"1053","type":"Selection"},{"attributes":{},"id":"1035","type":"UnionRenderers"},{"attributes":{"items":[{"id":"1038"},{"id":"1054"}],"location":null},"id":"1037","type":"Legend"},{"attributes":{},"id":"1036","type":"Selection"},{"attributes":{"axis_label":"Heads 
count","formatter":{"id":"1031"},"minor_tick_line_color":null,"ticker":{"id":"1016"}},"id":"1015","type":"LinearAxis"},{"attributes":{"fields":["active","pruned"]},"id":"1023","type":"Stack"},{"attributes":{"data":{"active":[7,7,3,5,4,4,4,5,7,4,8,7,9,11,10,14,14,11,13,13,12,8,6,8],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[9,9,13,11,12,12,12,11,9,12,8,9,7,5,6,2,2,5,3,3,4,8,10,8]},"selected":{"id":"1036"},"selection_policy":{"id":"1035"}},"id":"1024","type":"ColumnDataSource"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_color":{"value":"#0000ff"},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1026","type":"VBar"},{"attributes":{"axis":{"id":"1012"},"grid_line_color":null,"ticker":null},"id":"1014","type":"Grid"},{"attributes":{"above":[{"id":"1055"}],"below":[{"id":"1012"}],"center":[{"id":"1014"},{"id":"1018"},{"id":"1037"}],"left":[{"id":"1015"}],"outline_line_color":null,"plot_height":400,"renderers":[{"id":"1028"},{"id":"1043"}],"title":{"id":"1002"},"toolbar":{"id":"1019"},"toolbar_location":null,"x_range":{"id":"1004"},"x_scale":{"id":"1008"},"y_range":{"id":"1006"},"y_scale":{"id":"1010"}},"id":"1001","subtype":"Figure","type":"Plot"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1038","type":"LegendItem"}],"root_ids":["1001"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
- var render_items = [{"docid":"3225a67b-1996-4161-a7db-745c9acaf2b6","root_ids":["1001"],"roots":{"1001":"03ad75cf-8048-44ae-a1d6-db69021cc168"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
16
 
17
 
18
 
19
+ var element = document.getElementById("c81effce-5f17-4643-b14a-e5e982bed699");
20
  if (element == null) {
21
+ console.warn("Bokeh: autoload.js configured with elementid 'c81effce-5f17-4643-b14a-e5e982bed699' but no matching script tag was found.")
22
  }
23
 
24
 
115
  (function(root) {
116
  function embed_document(root) {
117
 
118
+ var docs_json = '{"c2f00807-bf51-4431-be89-feced9319ff4":{"roots":{"references":[{"attributes":{"start":0},"id":"1006","type":"DataRange1d"},{"attributes":{},"id":"1008","type":"CategoricalScale"},{"attributes":{},"id":"1052","type":"Selection"},{"attributes":{"axis":{"id":"1012"},"grid_line_color":null,"ticker":null},"id":"1014","type":"Grid"},{"attributes":{},"id":"1053","type":"UnionRenderers"},{"attributes":{"factors":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"range_padding":0.1},"id":"1004","type":"FactorRange"},{"attributes":{"above":[{"id":"1055"}],"below":[{"id":"1012"}],"center":[{"id":"1014"},{"id":"1018"},{"id":"1037"}],"left":[{"id":"1015"}],"outline_line_color":null,"plot_height":400,"renderers":[{"id":"1028"},{"id":"1043"}],"title":{"id":"1002"},"toolbar":{"id":"1019"},"toolbar_location":null,"x_range":{"id":"1004"},"x_scale":{"id":"1008"},"y_range":{"id":"1006"},"y_scale":{"id":"1010"}},"id":"1001","subtype":"Figure","type":"Plot"},{"attributes":{"items":[{"id":"1056"},{"id":"1057"}],"location":[10,0],"orientation":"horizontal"},"id":"1055","type":"Legend"},{"attributes":{"fields":[]},"id":"1020","type":"Stack"},{"attributes":{},"id":"1035","type":"Selection"},{"attributes":{},"id":"1031","type":"BasicTickFormatter"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1038","type":"LegendItem"},{"attributes":{},"id":"1036","type":"UnionRenderers"},{"attributes":{},"id":"1010","type":"LinearScale"},{"attributes":{"text":"Pruned Transformer 
Heads"},"id":"1002","type":"Title"},{"attributes":{},"id":"1033","type":"CategoricalTickFormatter"},{"attributes":{"data":{"active":[7,7,3,5,4,4,4,5,7,4,8,7,9,11,10,14,14,11,13,13,12,8,6,8],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[9,9,13,11,12,12,12,11,9,12,8,9,7,5,6,2,2,5,3,3,4,8,10,8]},"selected":{"id":"1052"},"selection_policy":{"id":"1053"}},"id":"1039","type":"ColumnDataSource"},{"attributes":{"label":{"value":"active"},"renderers":[{"id":"1028"}]},"id":"1056","type":"LegendItem"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1057","type":"LegendItem"},{"attributes":{"fields":["active"]},"id":"1021","type":"Stack"},{"attributes":{"source":{"id":"1039"}},"id":"1044","type":"CDSView"},{"attributes":{"axis":{"id":"1015"},"dimension":1,"ticker":null},"id":"1018","type":"Grid"},{"attributes":{},"id":"1016","type":"BasicTicker"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_color":{"value":"#ffcccc"},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1041","type":"VBar"},{"attributes":{"data_source":{"id":"1039"},"glyph":{"id":"1041"},"hover_glyph":null,"muted_glyph":null,"name":"pruned","nonselection_glyph":{"id":"1042"},"selection_glyph":null,"view":{"id":"1044"}},"id":"1043","type":"GlyphRenderer"},{"attributes":{"bottom":{"expr":{"id":"1022"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#ffcccc"},"line_alpha":{"value":0.1},"line_color":{"value":"#ffcccc"},"top":{"expr":{"id":"1023"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1042","type":"VBar"},{"attributes":{"data":{"active":[7,7,3,5,4,4,4,5,7,4,8,7,9,11,10,14,14,11,13,13,12,8,6,8],"layers":["0","1","2","3","4","5","6","7","8","9","10","11","12","13","14","15","16","17","18","19","20","21","22","23"],"pruned":[9,9,13,11,12,12,12,11,9,12,8,9,7,5,6,2,2,5,3,3,4,8,10,8]},"selected":{"id":"1035"},"selection_polic
y":{"id":"1036"}},"id":"1024","type":"ColumnDataSource"},{"attributes":{"label":{"value":"pruned"},"renderers":[{"id":"1043"}]},"id":"1054","type":"LegendItem"},{"attributes":{"axis_label":"Heads count","formatter":{"id":"1031"},"minor_tick_line_color":null,"ticker":{"id":"1016"}},"id":"1015","type":"LinearAxis"},{"attributes":{"fields":["active","pruned"]},"id":"1023","type":"Stack"},{"attributes":{"active_drag":"auto","active_inspect":"auto","active_multi":null,"active_scroll":"auto","active_tap":"auto"},"id":"1019","type":"Toolbar"},{"attributes":{"source":{"id":"1024"}},"id":"1029","type":"CDSView"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_color":{"value":"#0000ff"},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1026","type":"VBar"},{"attributes":{"fields":["active"]},"id":"1022","type":"Stack"},{"attributes":{"data_source":{"id":"1024"},"glyph":{"id":"1026"},"hover_glyph":null,"muted_glyph":null,"name":"active","nonselection_glyph":{"id":"1027"},"selection_glyph":null,"view":{"id":"1029"}},"id":"1028","type":"GlyphRenderer"},{"attributes":{"bottom":{"expr":{"id":"1020"}},"fill_alpha":{"value":0.1},"fill_color":{"value":"#0000ff"},"line_alpha":{"value":0.1},"line_color":{"value":"#0000ff"},"top":{"expr":{"id":"1021"}},"width":{"value":0.9},"x":{"field":"layers"}},"id":"1027","type":"VBar"},{"attributes":{"items":[{"id":"1038"},{"id":"1054"}],"location":null},"id":"1037","type":"Legend"},{"attributes":{},"id":"1013","type":"CategoricalTicker"},{"attributes":{"axis_label":"Layer index","formatter":{"id":"1033"},"minor_tick_line_color":null,"ticker":{"id":"1013"}},"id":"1012","type":"CategoricalAxis"}],"root_ids":["1001"]},"title":"Bokeh Application","version":"2.2.3"}}';
119
+ var render_items = [{"docid":"c2f00807-bf51-4431-be89-feced9319ff4","root_ids":["1001"],"roots":{"1001":"c81effce-5f17-4643-b14a-e5e982bed699"}}];
120
  root.Bokeh.embed.embed_items(docs_json, render_items);
121
 
122
  }
training/data_args.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_cache_dir": "dataset_cache",
3
+ "dataset_config_name": null,
4
+ "dataset_name": "squad_v2",
5
+ "doc_stride": 128,
6
+ "max_answer_length": 30,
7
+ "max_seq_length": 384,
8
+ "n_best_size": 20,
9
+ "null_score_diff_threshold": 0.0,
10
+ "overwrite_cache": 0,
11
+ "pad_to_max_length": true,
12
+ "preprocessing_num_workers": null,
13
+ "train_file": null,
14
+ "validation_file": null,
15
+ "version_2_with_negative": 1
16
+ }
training/model_args.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "cache_dir": null,
3
+ "config_name": null,
4
+ "model_name_or_path": "bert-large-uncased-whole-word-masking",
5
+ "tokenizer_name": null,
6
+ "use_fast_tokenizer": true
7
+ }
training/sparse_args.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ampere_pruning_method": "disabled",
3
+ "attention_block_cols": 32,
4
+ "attention_block_rows": 32,
5
+ "attention_lambda": 1.0,
6
+ "attention_output_with_dense": 0,
7
+ "attention_pruning_method": "sigmoied_threshold",
8
+ "bias_mask": true,
9
+ "dense_block_cols": 1,
10
+ "dense_block_rows": 1,
11
+ "dense_lambda": 1.0,
12
+ "dense_pruning_method": "sigmoied_threshold:1d_alt",
13
+ "distil_alpha_ce": 0.1,
14
+ "distil_alpha_teacher": 0.9,
15
+ "distil_teacher_name_or_path": "madlag/bert-large-uncased-whole-word-masking-finetuned-squadv2",
16
+ "distil_temperature": 2.0,
17
+ "eval_with_current_patch_params": false,
18
+ "final_ampere_temperature": 20.0,
19
+ "final_finetune": false,
20
+ "final_threshold": 0.1,
21
+ "final_warmup": 10,
22
+ "gelu_patch": 0,
23
+ "gelu_patch_steps": 50000,
24
+ "initial_ampere_temperature": 0.0,
25
+ "initial_threshold": 0,
26
+ "initial_warmup": 1,
27
+ "layer_norm_patch": 0,
28
+ "layer_norm_patch_start_delta": 0.99,
29
+ "layer_norm_patch_steps": 50000,
30
+ "linear_min_parameters": 0.005,
31
+ "mask_init": "constant",
32
+ "mask_scale": 0.0,
33
+ "mask_scores_learning_rate": 0.01,
34
+ "qat": false,
35
+ "qconfig": "default",
36
+ "regularization": "l1",
37
+ "regularization_final_lambda": 5,
38
+ "rewind_model_name_or_path": null
39
+ }
training/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b41d66c3a0afbe05264fcba8565ebb11633b8a0a821585f9497748f4d2c9e7
3
+ size 2415