bart-base-cnn-r2-19.4-d35-hybrid / eval /sparsity_report.json
echarlaix's picture
echarlaix HF staff
Adding model, graphs and metadata.
acb6565
{"total": 139420416, "nnz": 75103537, "linear_total": 99090432, "linear_nnz": 34815488, "layers": {"0": {"total": 16539648, "nnz": 5698134, "linear_total": 16515072, "linear_nnz": 5680128, "linear_attention_total": 7077888, "linear_attention_nnz": 5253120, "linear_dense_total": 9437184, "linear_dense_nnz": 427008}, "1": {"total": 16539648, "nnz": 5882390, "linear_total": 16515072, "linear_nnz": 5864448, "linear_attention_total": 7077888, "linear_attention_nnz": 4552704, "linear_dense_total": 9437184, "linear_dense_nnz": 1311744}, "2": {"total": 16539648, "nnz": 6119725, "linear_total": 16515072, "linear_nnz": 6101504, "linear_attention_total": 7077888, "linear_attention_nnz": 4901888, "linear_dense_total": 9437184, "linear_dense_nnz": 1199616}, "3": {"total": 16539648, "nnz": 5134569, "linear_total": 16515072, "linear_nnz": 5117440, "linear_attention_total": 7077888, "linear_attention_nnz": 4071424, "linear_dense_total": 9437184, "linear_dense_nnz": 1046016}, "4": {"total": 16539648, "nnz": 5147372, "linear_total": 16515072, "linear_nnz": 5130240, "linear_attention_total": 7077888, "linear_attention_nnz": 4177920, "linear_dense_total": 9437184, "linear_dense_nnz": 952320}, "5": {"total": 16539648, "nnz": 6940355, "linear_total": 16515072, "linear_nnz": 6921728, "linear_attention_total": 7077888, "linear_attention_nnz": 5688320, "linear_dense_total": 9437184, "linear_dense_nnz": 1233408}}, "total_sparsity": 46.13160743975976, "linear_sparsity": 64.86493468915344, "pruned_heads": {"0": [], "1": [6], "2": [4, 6], "3": [0, 1, 2, 7, 11], "4": [1, 2, 5, 6, 10, 11], "5": [3], "6": [12, 13, 14], "7": [2, 11, 16, 18, 19, 23], "8": [16, 21], "9": [3, 12, 13, 15, 16, 18, 22], "10": [3, 14, 18, 20], "11": [10]}}