echarlaix's picture
echarlaix
HF staff
Adding model, graphs and metadata.
83d7ce2
{"total": 109466882, "nnz": 56374189, "linear_total": 84934656, "linear_nnz": 31863296, "layers": {"0": {"total": 7086528, "nnz": 3073417, "linear_total": 7077888, "linear_nnz": 3066368, "linear_attention_total": 2359296, "linear_attention_nnz": 496640, "linear_dense_total": 4718592, "linear_dense_nnz": 2569728}, "1": {"total": 7086336, "nnz": 3253643, "linear_total": 7077888, "linear_nnz": 3246592, "linear_attention_total": 2359296, "linear_attention_nnz": 526336, "linear_dense_total": 4718592, "linear_dense_nnz": 2720256}, "2": {"total": 7086144, "nnz": 3723797, "linear_total": 7077888, "linear_nnz": 3716608, "linear_attention_total": 2359296, "linear_attention_nnz": 440320, "linear_dense_total": 4718592, "linear_dense_nnz": 3276288}, "3": {"total": 7086144, "nnz": 3890416, "linear_total": 7077888, "linear_nnz": 3883008, "linear_attention_total": 2359296, "linear_attention_nnz": 466944, "linear_dense_total": 4718592, "linear_dense_nnz": 3416064}, "4": {"total": 7086912, "nnz": 3876149, "linear_total": 7077888, "linear_nnz": 3868160, "linear_attention_total": 2359296, "linear_attention_nnz": 591872, "linear_dense_total": 4718592, "linear_dense_nnz": 3276288}, "5": {"total": 7087104, "nnz": 3973982, "linear_total": 7077888, "linear_nnz": 3965952, "linear_attention_total": 2359296, "linear_attention_nnz": 774144, "linear_dense_total": 4718592, "linear_dense_nnz": 3191808}, "6": {"total": 7086720, "nnz": 3478463, "linear_total": 7077888, "linear_nnz": 3470848, "linear_attention_total": 2359296, "linear_attention_nnz": 572416, "linear_dense_total": 4718592, "linear_dense_nnz": 2898432}, "7": {"total": 7086912, "nnz": 3203308, "linear_total": 7077888, "linear_nnz": 3195904, "linear_attention_total": 2359296, "linear_attention_nnz": 867328, "linear_dense_total": 4718592, "linear_dense_nnz": 2328576}, "8": {"total": 7086720, "nnz": 1837865, "linear_total": 7077888, "linear_nnz": 1831424, "linear_attention_total": 2359296, "linear_attention_nnz": 637952, "linear_dense_total": 4718592, "linear_dense_nnz": 1193472}, "9": {"total": 7086336, "nnz": 906736, "linear_total": 7077888, "linear_nnz": 901120, "linear_attention_total": 2359296, "linear_attention_nnz": 385024, "linear_dense_total": 4718592, "linear_dense_nnz": 516096}, "10": {"total": 7085952, "nnz": 481310, "linear_total": 7077888, "linear_nnz": 476160, "linear_attention_total": 2359296, "linear_attention_nnz": 233472, "linear_dense_total": 4718592, "linear_dense_nnz": 242688}, "11": {"total": 7085760, "nnz": 245789, "linear_total": 7077888, "linear_nnz": 241152, "linear_attention_total": 2359296, "linear_attention_nnz": 0, "linear_dense_total": 4718592, "linear_dense_nnz": 241152}}, "total_sparsity": 48.501146675576265, "linear_sparsity": 62.48492959104939, "pruned_heads": {"0": [0, 4, 6, 7, 8, 9, 11], "1": [0, 2, 3, 5, 6, 7, 8, 9], "2": [2, 3, 4, 5, 6, 7, 8, 10, 11], "3": [0, 1, 2, 3, 4, 6, 7, 8, 11], "4": [1, 2, 3, 4, 8], "5": [1, 2, 11, 5], "6": [1, 3, 7, 9, 10, 11], "7": [2, 4, 6, 7, 11], "8": [0, 2, 3, 4, 5, 6], "9": [0, 1, 3, 4, 6, 8, 9, 11], "10": [0, 1, 2, 3, 5, 6, 7, 8, 9, 10], "11": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11]}}