Upload folder using huggingface_hub
Browse files- config.json +61 -0
- model.safetensors +3 -0
- quant_log.csv +561 -0
- quantize_config.json +20 -0
config.json
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
+
"_name_or_path": "meta-llama/Llama-3.3-70B-Instruct",
|
4 |
+
"architectures": [
|
5 |
+
"LlamaForCausalLM"
|
6 |
+
],
|
7 |
+
"attention_bias": false,
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 128000,
|
10 |
+
"eos_token_id": [
|
11 |
+
128001,
|
12 |
+
128008,
|
13 |
+
128009
|
14 |
+
],
|
15 |
+
"head_dim": 128,
|
16 |
+
"hidden_act": "silu",
|
17 |
+
"hidden_size": 8192,
|
18 |
+
"initializer_range": 0.02,
|
19 |
+
"intermediate_size": 28672,
|
20 |
+
"max_position_embeddings": 131072,
|
21 |
+
"mlp_bias": false,
|
22 |
+
"model_type": "llama",
|
23 |
+
"num_attention_heads": 64,
|
24 |
+
"num_hidden_layers": 80,
|
25 |
+
"num_key_value_heads": 8,
|
26 |
+
"pretraining_tp": 1,
|
27 |
+
"quantization_config": {
|
28 |
+
"bits": 4,
|
29 |
+
"checkpoint_format": "gptq",
|
30 |
+
"desc_act": true,
|
31 |
+
"dynamic": null,
|
32 |
+
"group_size": 128,
|
33 |
+
"lm_head": false,
|
34 |
+
"meta": {
|
35 |
+
"damp_auto_increment": 0.0015,
|
36 |
+
"damp_percent": 0.01,
|
37 |
+
"quantizer": [
|
38 |
+
"gptqmodel:1.4.0-dev"
|
39 |
+
],
|
40 |
+
"static_groups": false,
|
41 |
+
"true_sequential": true,
|
42 |
+
"uri": "https://github.com/modelcloud/gptqmodel"
|
43 |
+
},
|
44 |
+
"quant_method": "gptq",
|
45 |
+
"sym": true
|
46 |
+
},
|
47 |
+
"rms_norm_eps": 1e-05,
|
48 |
+
"rope_scaling": {
|
49 |
+
"factor": 8.0,
|
50 |
+
"high_freq_factor": 4.0,
|
51 |
+
"low_freq_factor": 1.0,
|
52 |
+
"original_max_position_embeddings": 8192,
|
53 |
+
"rope_type": "llama3"
|
54 |
+
},
|
55 |
+
"rope_theta": 500000.0,
|
56 |
+
"tie_word_embeddings": false,
|
57 |
+
"torch_dtype": "bfloat16",
|
58 |
+
"transformers_version": "4.47.0",
|
59 |
+
"use_cache": true,
|
60 |
+
"vocab_size": 128256
|
61 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7922de01bdca5ad0d97084163f53b2954a48b179a006c25e838d45432046f587
|
3 |
+
size 39792965480
|
quant_log.csv
ADDED
@@ -0,0 +1,561 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
layer,module,loss,damp,time
|
2 |
+
0,self_attn.k_proj,0.57035,0.01000,2.657
|
3 |
+
0,self_attn.v_proj,1.47052,0.01000,2.351
|
4 |
+
0,self_attn.q_proj,1.32896,0.01000,2.406
|
5 |
+
0,self_attn.o_proj,0.00012,0.01000,2.410
|
6 |
+
0,mlp.up_proj,0.42204,0.01000,2.590
|
7 |
+
0,mlp.gate_proj,0.43135,0.01000,2.543
|
8 |
+
0,mlp.down_proj,0.00059,0.01000,12.464
|
9 |
+
1,self_attn.k_proj,0.42801,0.01000,2.404
|
10 |
+
1,self_attn.v_proj,0.40142,0.01000,2.362
|
11 |
+
1,self_attn.q_proj,1.63970,0.01000,2.426
|
12 |
+
1,self_attn.o_proj,0.00060,0.01000,2.436
|
13 |
+
1,mlp.up_proj,0.42048,0.01000,2.597
|
14 |
+
1,mlp.gate_proj,0.43219,0.01000,2.544
|
15 |
+
1,mlp.down_proj,0.00066,0.01000,12.450
|
16 |
+
2,self_attn.k_proj,0.13810,0.01000,2.390
|
17 |
+
2,self_attn.v_proj,0.02891,0.01000,2.347
|
18 |
+
2,self_attn.q_proj,0.63511,0.01000,2.417
|
19 |
+
2,self_attn.o_proj,0.00098,0.01000,2.426
|
20 |
+
2,mlp.up_proj,0.94861,0.01000,2.574
|
21 |
+
2,mlp.gate_proj,0.97155,0.01000,2.534
|
22 |
+
2,mlp.down_proj,0.00155,0.01000,12.369
|
23 |
+
3,self_attn.k_proj,0.37560,0.01000,2.370
|
24 |
+
3,self_attn.v_proj,0.05439,0.01000,2.339
|
25 |
+
3,self_attn.q_proj,1.19933,0.01000,2.401
|
26 |
+
3,self_attn.o_proj,0.00116,0.01000,2.424
|
27 |
+
3,mlp.up_proj,1.59134,0.01000,2.584
|
28 |
+
3,mlp.gate_proj,1.77250,0.01000,2.544
|
29 |
+
3,mlp.down_proj,0.02647,0.01000,12.401
|
30 |
+
4,self_attn.k_proj,0.41622,0.01000,2.398
|
31 |
+
4,self_attn.v_proj,0.06400,0.01000,2.358
|
32 |
+
4,self_attn.q_proj,1.26602,0.01000,2.411
|
33 |
+
4,self_attn.o_proj,0.00084,0.01000,2.422
|
34 |
+
4,mlp.up_proj,1.74960,0.01000,2.584
|
35 |
+
4,mlp.gate_proj,1.80884,0.01000,2.540
|
36 |
+
4,mlp.down_proj,0.00400,0.01000,12.399
|
37 |
+
5,self_attn.k_proj,0.60114,0.01000,2.393
|
38 |
+
5,self_attn.v_proj,0.13286,0.01000,2.344
|
39 |
+
5,self_attn.q_proj,1.89099,0.01000,2.419
|
40 |
+
5,self_attn.o_proj,0.00190,0.01000,2.437
|
41 |
+
5,mlp.up_proj,2.20372,0.01000,2.589
|
42 |
+
5,mlp.gate_proj,2.37831,0.01000,2.540
|
43 |
+
5,mlp.down_proj,0.00660,0.01000,12.367
|
44 |
+
6,self_attn.k_proj,1.00460,0.01000,2.371
|
45 |
+
6,self_attn.v_proj,0.15128,0.01000,2.326
|
46 |
+
6,self_attn.q_proj,2.92848,0.01000,2.386
|
47 |
+
6,self_attn.o_proj,0.00212,0.01000,2.409
|
48 |
+
6,mlp.up_proj,2.19970,0.01000,2.576
|
49 |
+
6,mlp.gate_proj,2.31402,0.01000,2.532
|
50 |
+
6,mlp.down_proj,0.00919,0.01000,12.448
|
51 |
+
7,self_attn.k_proj,1.19295,0.01000,2.380
|
52 |
+
7,self_attn.v_proj,0.17405,0.01000,2.322
|
53 |
+
7,self_attn.q_proj,3.59537,0.01000,2.403
|
54 |
+
7,self_attn.o_proj,0.00162,0.01000,2.428
|
55 |
+
7,mlp.up_proj,2.58627,0.01000,2.576
|
56 |
+
7,mlp.gate_proj,2.73543,0.01000,2.530
|
57 |
+
7,mlp.down_proj,0.01228,0.01000,12.390
|
58 |
+
8,self_attn.k_proj,0.88642,0.01000,2.384
|
59 |
+
8,self_attn.v_proj,0.16166,0.01000,2.319
|
60 |
+
8,self_attn.q_proj,2.53692,0.01000,2.407
|
61 |
+
8,self_attn.o_proj,0.00341,0.01000,2.410
|
62 |
+
8,mlp.up_proj,3.88630,0.01000,2.579
|
63 |
+
8,mlp.gate_proj,4.10945,0.01000,2.534
|
64 |
+
8,mlp.down_proj,0.01468,0.01000,12.399
|
65 |
+
9,self_attn.k_proj,0.75486,0.01000,2.376
|
66 |
+
9,self_attn.v_proj,0.12879,0.01000,2.322
|
67 |
+
9,self_attn.q_proj,2.22640,0.01000,2.396
|
68 |
+
9,self_attn.o_proj,0.00491,0.01000,2.402
|
69 |
+
9,mlp.up_proj,6.16445,0.01000,2.583
|
70 |
+
9,mlp.gate_proj,6.62525,0.01000,2.535
|
71 |
+
9,mlp.down_proj,0.01891,0.01000,12.377
|
72 |
+
10,self_attn.k_proj,2.21197,0.01000,2.372
|
73 |
+
10,self_attn.v_proj,0.29660,0.01000,2.325
|
74 |
+
10,self_attn.q_proj,6.23046,0.01000,2.413
|
75 |
+
10,self_attn.o_proj,0.00592,0.01000,2.384
|
76 |
+
10,mlp.up_proj,4.15596,0.01000,2.571
|
77 |
+
10,mlp.gate_proj,4.44713,0.01000,2.536
|
78 |
+
10,mlp.down_proj,0.02901,0.01000,12.351
|
79 |
+
11,self_attn.k_proj,2.23967,0.01000,2.400
|
80 |
+
11,self_attn.v_proj,0.31593,0.01000,2.351
|
81 |
+
11,self_attn.q_proj,5.37146,0.01000,2.396
|
82 |
+
11,self_attn.o_proj,0.00716,0.01000,2.390
|
83 |
+
11,mlp.up_proj,6.03220,0.01000,2.578
|
84 |
+
11,mlp.gate_proj,6.44322,0.01000,2.534
|
85 |
+
11,mlp.down_proj,0.03901,0.01000,12.379
|
86 |
+
12,self_attn.k_proj,1.53060,0.01000,2.379
|
87 |
+
12,self_attn.v_proj,0.26643,0.01000,2.330
|
88 |
+
12,self_attn.q_proj,4.37793,0.01000,2.396
|
89 |
+
12,self_attn.o_proj,0.00726,0.01000,2.401
|
90 |
+
12,mlp.up_proj,5.41540,0.01000,2.584
|
91 |
+
12,mlp.gate_proj,5.80091,0.01000,2.539
|
92 |
+
12,mlp.down_proj,0.04740,0.01000,12.316
|
93 |
+
13,self_attn.k_proj,2.27633,0.01000,2.376
|
94 |
+
13,self_attn.v_proj,0.30485,0.01000,2.320
|
95 |
+
13,self_attn.q_proj,6.06090,0.01000,2.388
|
96 |
+
13,self_attn.o_proj,0.02961,0.01000,2.405
|
97 |
+
13,mlp.up_proj,5.01690,0.01000,2.576
|
98 |
+
13,mlp.gate_proj,5.32263,0.01000,2.531
|
99 |
+
13,mlp.down_proj,0.06650,0.01000,12.387
|
100 |
+
14,self_attn.k_proj,2.83633,0.01000,2.373
|
101 |
+
14,self_attn.v_proj,0.37186,0.01000,2.312
|
102 |
+
14,self_attn.q_proj,8.34845,0.01000,2.401
|
103 |
+
14,self_attn.o_proj,0.04001,0.01000,2.407
|
104 |
+
14,mlp.up_proj,6.58338,0.01000,2.553
|
105 |
+
14,mlp.gate_proj,7.04548,0.01000,2.526
|
106 |
+
14,mlp.down_proj,0.09719,0.01000,12.348
|
107 |
+
15,self_attn.k_proj,2.48118,0.01000,2.397
|
108 |
+
15,self_attn.v_proj,0.35579,0.01000,2.340
|
109 |
+
15,self_attn.q_proj,7.05407,0.01000,2.412
|
110 |
+
15,self_attn.o_proj,0.04138,0.01000,2.441
|
111 |
+
15,mlp.up_proj,7.82927,0.01000,2.577
|
112 |
+
15,mlp.gate_proj,8.54841,0.01000,2.537
|
113 |
+
15,mlp.down_proj,0.12537,0.01000,12.442
|
114 |
+
16,self_attn.k_proj,2.62704,0.01000,2.372
|
115 |
+
16,self_attn.v_proj,0.39784,0.01000,2.336
|
116 |
+
16,self_attn.q_proj,8.07435,0.01000,2.379
|
117 |
+
16,self_attn.o_proj,0.05020,0.01000,2.401
|
118 |
+
16,mlp.up_proj,10.08904,0.01000,2.570
|
119 |
+
16,mlp.gate_proj,11.10111,0.01000,2.528
|
120 |
+
16,mlp.down_proj,0.16947,0.01000,12.337
|
121 |
+
17,self_attn.k_proj,4.36580,0.01000,2.385
|
122 |
+
17,self_attn.v_proj,0.46434,0.01000,2.309
|
123 |
+
17,self_attn.q_proj,12.00885,0.01000,2.414
|
124 |
+
17,self_attn.o_proj,0.12850,0.01000,2.425
|
125 |
+
17,mlp.up_proj,12.33495,0.01000,2.574
|
126 |
+
17,mlp.gate_proj,13.55825,0.01000,2.529
|
127 |
+
17,mlp.down_proj,0.24378,0.01000,12.424
|
128 |
+
18,self_attn.k_proj,5.60858,0.01000,2.380
|
129 |
+
18,self_attn.v_proj,0.63289,0.01000,2.354
|
130 |
+
18,self_attn.q_proj,16.55243,0.01000,2.401
|
131 |
+
18,self_attn.o_proj,0.14321,0.01000,2.402
|
132 |
+
18,mlp.up_proj,15.96843,0.01000,2.550
|
133 |
+
18,mlp.gate_proj,17.98333,0.01000,2.500
|
134 |
+
18,mlp.down_proj,0.32340,0.01000,12.371
|
135 |
+
19,self_attn.k_proj,5.16959,0.01000,2.400
|
136 |
+
19,self_attn.v_proj,0.74440,0.01000,2.347
|
137 |
+
19,self_attn.q_proj,14.47852,0.01000,2.394
|
138 |
+
19,self_attn.o_proj,0.14691,0.01000,2.430
|
139 |
+
19,mlp.up_proj,16.84079,0.01000,2.590
|
140 |
+
19,mlp.gate_proj,19.60419,0.01000,2.546
|
141 |
+
19,mlp.down_proj,0.36414,0.01000,12.410
|
142 |
+
20,self_attn.k_proj,6.47528,0.01000,2.380
|
143 |
+
20,self_attn.v_proj,0.74963,0.01000,2.327
|
144 |
+
20,self_attn.q_proj,14.17394,0.01000,2.408
|
145 |
+
20,self_attn.o_proj,0.11211,0.01000,2.410
|
146 |
+
20,mlp.up_proj,18.55169,0.01000,2.570
|
147 |
+
20,mlp.gate_proj,21.14960,0.01000,2.524
|
148 |
+
20,mlp.down_proj,0.37619,0.01000,12.351
|
149 |
+
21,self_attn.k_proj,9.81788,0.01000,2.356
|
150 |
+
21,self_attn.v_proj,0.89676,0.01000,2.299
|
151 |
+
21,self_attn.q_proj,22.92135,0.01000,2.392
|
152 |
+
21,self_attn.o_proj,0.16588,0.01000,2.393
|
153 |
+
21,mlp.up_proj,21.32033,0.01000,2.581
|
154 |
+
21,mlp.gate_proj,24.48094,0.01000,2.538
|
155 |
+
21,mlp.down_proj,0.42420,0.01000,12.352
|
156 |
+
22,self_attn.k_proj,10.66650,0.01000,2.377
|
157 |
+
22,self_attn.v_proj,1.39040,0.01000,2.323
|
158 |
+
22,self_attn.q_proj,23.65294,0.01000,2.398
|
159 |
+
22,self_attn.o_proj,0.09598,0.01000,2.427
|
160 |
+
22,mlp.up_proj,23.02085,0.01000,2.577
|
161 |
+
22,mlp.gate_proj,27.06548,0.01000,2.531
|
162 |
+
22,mlp.down_proj,0.42023,0.01000,12.385
|
163 |
+
23,self_attn.k_proj,11.88396,0.01000,2.400
|
164 |
+
23,self_attn.v_proj,1.27841,0.01000,2.370
|
165 |
+
23,self_attn.q_proj,25.22909,0.01000,2.417
|
166 |
+
23,self_attn.o_proj,0.12637,0.01000,2.437
|
167 |
+
23,mlp.up_proj,24.15950,0.01000,2.603
|
168 |
+
23,mlp.gate_proj,28.57765,0.01000,2.561
|
169 |
+
23,mlp.down_proj,0.42992,0.01000,12.479
|
170 |
+
24,self_attn.k_proj,6.27533,0.01000,2.372
|
171 |
+
24,self_attn.v_proj,0.67591,0.01000,2.308
|
172 |
+
24,self_attn.q_proj,11.09771,0.01000,2.394
|
173 |
+
24,self_attn.o_proj,0.10294,0.01000,2.407
|
174 |
+
24,mlp.up_proj,25.17421,0.01000,2.575
|
175 |
+
24,mlp.gate_proj,29.08055,0.01000,2.531
|
176 |
+
24,mlp.down_proj,0.45674,0.01000,12.389
|
177 |
+
25,self_attn.k_proj,12.02082,0.01000,2.411
|
178 |
+
25,self_attn.v_proj,1.35643,0.01000,2.373
|
179 |
+
25,self_attn.q_proj,23.12022,0.01000,2.414
|
180 |
+
25,self_attn.o_proj,0.11384,0.01000,2.408
|
181 |
+
25,mlp.up_proj,27.31142,0.01000,2.594
|
182 |
+
25,mlp.gate_proj,31.58317,0.01000,2.558
|
183 |
+
25,mlp.down_proj,0.49229,0.01000,12.438
|
184 |
+
26,self_attn.k_proj,11.96870,0.01000,2.423
|
185 |
+
26,self_attn.v_proj,1.38614,0.01000,2.350
|
186 |
+
26,self_attn.q_proj,23.65503,0.01000,2.426
|
187 |
+
26,self_attn.o_proj,0.12416,0.01000,2.423
|
188 |
+
26,mlp.up_proj,28.19983,0.01000,2.614
|
189 |
+
26,mlp.gate_proj,32.36074,0.01000,2.552
|
190 |
+
26,mlp.down_proj,0.52981,0.01000,12.445
|
191 |
+
27,self_attn.k_proj,12.18930,0.01000,2.377
|
192 |
+
27,self_attn.v_proj,0.86143,0.01000,2.337
|
193 |
+
27,self_attn.q_proj,23.78441,0.01000,2.410
|
194 |
+
27,self_attn.o_proj,0.25728,0.01000,2.420
|
195 |
+
27,mlp.up_proj,26.60479,0.01000,2.577
|
196 |
+
27,mlp.gate_proj,29.91342,0.01000,2.543
|
197 |
+
27,mlp.down_proj,0.57599,0.01000,12.401
|
198 |
+
28,self_attn.k_proj,14.01640,0.01000,2.407
|
199 |
+
28,self_attn.v_proj,1.19739,0.01000,2.365
|
200 |
+
28,self_attn.q_proj,28.35421,0.01000,2.401
|
201 |
+
28,self_attn.o_proj,0.21742,0.01000,2.434
|
202 |
+
28,mlp.up_proj,27.32375,0.01000,2.588
|
203 |
+
28,mlp.gate_proj,30.71216,0.01000,2.542
|
204 |
+
28,mlp.down_proj,0.64283,0.01000,12.378
|
205 |
+
29,self_attn.k_proj,14.76551,0.01000,2.398
|
206 |
+
29,self_attn.v_proj,1.14310,0.01000,2.362
|
207 |
+
29,self_attn.q_proj,28.58216,0.01000,2.409
|
208 |
+
29,self_attn.o_proj,0.24004,0.01000,2.427
|
209 |
+
29,mlp.up_proj,28.34542,0.01000,2.598
|
210 |
+
29,mlp.gate_proj,31.86575,0.01000,2.552
|
211 |
+
29,mlp.down_proj,0.68480,0.01000,12.450
|
212 |
+
30,self_attn.k_proj,11.88239,0.01000,2.395
|
213 |
+
30,self_attn.v_proj,0.98647,0.01000,2.343
|
214 |
+
30,self_attn.q_proj,23.09733,0.01000,2.407
|
215 |
+
30,self_attn.o_proj,0.25479,0.01000,2.423
|
216 |
+
30,mlp.up_proj,27.81762,0.01000,2.594
|
217 |
+
30,mlp.gate_proj,30.93171,0.01000,2.547
|
218 |
+
30,mlp.down_proj,0.67414,0.01000,12.351
|
219 |
+
31,self_attn.k_proj,15.44827,0.01000,2.383
|
220 |
+
31,self_attn.v_proj,1.00508,0.01000,2.325
|
221 |
+
31,self_attn.q_proj,33.67770,0.01000,2.384
|
222 |
+
31,self_attn.o_proj,0.44765,0.01000,2.412
|
223 |
+
31,mlp.up_proj,28.46461,0.01000,2.577
|
224 |
+
31,mlp.gate_proj,30.97182,0.01000,2.531
|
225 |
+
31,mlp.down_proj,0.70130,0.01000,12.405
|
226 |
+
32,self_attn.k_proj,10.04720,0.01000,2.386
|
227 |
+
32,self_attn.v_proj,1.12798,0.01000,2.354
|
228 |
+
32,self_attn.q_proj,20.07824,0.01000,2.389
|
229 |
+
32,self_attn.o_proj,0.18536,0.01000,2.413
|
230 |
+
32,mlp.up_proj,28.29184,0.01000,2.573
|
231 |
+
32,mlp.gate_proj,31.21350,0.01000,2.531
|
232 |
+
32,mlp.down_proj,0.73541,0.01000,12.368
|
233 |
+
33,self_attn.k_proj,15.88254,0.01000,2.391
|
234 |
+
33,self_attn.v_proj,1.10900,0.01000,2.339
|
235 |
+
33,self_attn.q_proj,34.42078,0.01000,2.400
|
236 |
+
33,self_attn.o_proj,0.41791,0.01000,2.406
|
237 |
+
33,mlp.up_proj,70.70566,0.01000,2.585
|
238 |
+
33,mlp.gate_proj,75.96263,0.01000,2.542
|
239 |
+
33,mlp.down_proj,0.75321,0.01000,12.361
|
240 |
+
34,self_attn.k_proj,13.84434,0.01000,2.406
|
241 |
+
34,self_attn.v_proj,1.10936,0.01000,2.333
|
242 |
+
34,self_attn.q_proj,29.83056,0.01000,2.424
|
243 |
+
34,self_attn.o_proj,0.38872,0.01000,2.434
|
244 |
+
34,mlp.up_proj,28.14292,0.01000,2.600
|
245 |
+
34,mlp.gate_proj,30.72616,0.01000,2.556
|
246 |
+
34,mlp.down_proj,0.77032,0.01000,12.496
|
247 |
+
35,self_attn.k_proj,15.87492,0.01000,2.381
|
248 |
+
35,self_attn.v_proj,1.14817,0.01000,2.320
|
249 |
+
35,self_attn.q_proj,32.89777,0.01000,2.401
|
250 |
+
35,self_attn.o_proj,0.42289,0.01000,2.409
|
251 |
+
35,mlp.up_proj,28.14214,0.01000,2.578
|
252 |
+
35,mlp.gate_proj,30.94142,0.01000,2.535
|
253 |
+
35,mlp.down_proj,0.71352,0.01000,12.380
|
254 |
+
36,self_attn.k_proj,11.59319,0.01000,2.377
|
255 |
+
36,self_attn.v_proj,0.98563,0.01000,2.318
|
256 |
+
36,self_attn.q_proj,21.57438,0.01000,2.384
|
257 |
+
36,self_attn.o_proj,0.17942,0.01000,2.410
|
258 |
+
36,mlp.up_proj,27.42457,0.01000,2.569
|
259 |
+
36,mlp.gate_proj,30.79939,0.01000,2.525
|
260 |
+
36,mlp.down_proj,0.72106,0.01000,12.391
|
261 |
+
37,self_attn.k_proj,14.81283,0.01000,2.376
|
262 |
+
37,self_attn.v_proj,1.04597,0.01000,2.331
|
263 |
+
37,self_attn.q_proj,28.01339,0.01000,2.409
|
264 |
+
37,self_attn.o_proj,0.22077,0.01000,2.419
|
265 |
+
37,mlp.up_proj,27.39221,0.01000,2.575
|
266 |
+
37,mlp.gate_proj,30.75794,0.01000,2.540
|
267 |
+
37,mlp.down_proj,0.69618,0.01000,12.390
|
268 |
+
38,self_attn.k_proj,13.16148,0.01000,2.380
|
269 |
+
38,self_attn.v_proj,1.12986,0.01000,2.324
|
270 |
+
38,self_attn.q_proj,24.62405,0.01000,2.385
|
271 |
+
38,self_attn.o_proj,0.22751,0.01000,2.415
|
272 |
+
38,mlp.up_proj,27.54411,0.01000,2.548
|
273 |
+
38,mlp.gate_proj,31.43366,0.01000,2.528
|
274 |
+
38,mlp.down_proj,0.67293,0.01000,12.317
|
275 |
+
39,self_attn.k_proj,13.35156,0.01000,2.397
|
276 |
+
39,self_attn.v_proj,1.18738,0.01000,2.355
|
277 |
+
39,self_attn.q_proj,23.59219,0.01000,2.401
|
278 |
+
39,self_attn.o_proj,0.16937,0.01000,2.409
|
279 |
+
39,mlp.up_proj,27.48190,0.01000,2.570
|
280 |
+
39,mlp.gate_proj,31.72308,0.01000,2.532
|
281 |
+
39,mlp.down_proj,0.66521,0.01000,12.420
|
282 |
+
40,self_attn.k_proj,10.13054,0.01000,2.424
|
283 |
+
40,self_attn.v_proj,1.36028,0.01000,2.365
|
284 |
+
40,self_attn.q_proj,20.56631,0.01000,2.418
|
285 |
+
40,self_attn.o_proj,0.12621,0.01000,2.438
|
286 |
+
40,mlp.up_proj,27.66399,0.01000,2.608
|
287 |
+
40,mlp.gate_proj,32.16180,0.01000,2.564
|
288 |
+
40,mlp.down_proj,0.72769,0.01000,12.428
|
289 |
+
41,self_attn.k_proj,12.69510,0.01000,2.375
|
290 |
+
41,self_attn.v_proj,1.12165,0.01000,2.328
|
291 |
+
41,self_attn.q_proj,21.96209,0.01000,2.390
|
292 |
+
41,self_attn.o_proj,0.13793,0.01000,2.423
|
293 |
+
41,mlp.up_proj,28.21097,0.01000,2.587
|
294 |
+
41,mlp.gate_proj,32.82212,0.01000,2.546
|
295 |
+
41,mlp.down_proj,0.69244,0.01000,12.410
|
296 |
+
42,self_attn.k_proj,8.44118,0.01000,2.378
|
297 |
+
42,self_attn.v_proj,0.90866,0.01000,2.322
|
298 |
+
42,self_attn.q_proj,13.04269,0.01000,2.396
|
299 |
+
42,self_attn.o_proj,0.08163,0.01000,2.397
|
300 |
+
42,mlp.up_proj,28.56101,0.01000,2.581
|
301 |
+
42,mlp.gate_proj,33.50828,0.01000,2.542
|
302 |
+
42,mlp.down_proj,0.64698,0.01000,12.371
|
303 |
+
43,self_attn.k_proj,8.92527,0.01000,2.391
|
304 |
+
43,self_attn.v_proj,0.98848,0.01000,2.324
|
305 |
+
43,self_attn.q_proj,14.44163,0.01000,2.393
|
306 |
+
43,self_attn.o_proj,0.09209,0.01000,2.430
|
307 |
+
43,mlp.up_proj,29.11296,0.01000,2.580
|
308 |
+
43,mlp.gate_proj,34.40512,0.01000,2.531
|
309 |
+
43,mlp.down_proj,0.68803,0.01000,12.424
|
310 |
+
44,self_attn.k_proj,13.99534,0.01000,2.388
|
311 |
+
44,self_attn.v_proj,1.57364,0.01000,2.340
|
312 |
+
44,self_attn.q_proj,28.14628,0.01000,2.410
|
313 |
+
44,self_attn.o_proj,0.14434,0.01000,2.418
|
314 |
+
44,mlp.up_proj,29.51572,0.01000,2.598
|
315 |
+
44,mlp.gate_proj,35.05244,0.01000,2.552
|
316 |
+
44,mlp.down_proj,0.76233,0.01000,12.385
|
317 |
+
45,self_attn.k_proj,8.35592,0.01000,2.405
|
318 |
+
45,self_attn.v_proj,0.92035,0.01000,2.346
|
319 |
+
45,self_attn.q_proj,13.71338,0.01000,2.417
|
320 |
+
45,self_attn.o_proj,0.12826,0.01000,2.435
|
321 |
+
45,mlp.up_proj,29.94445,0.01000,2.594
|
322 |
+
45,mlp.gate_proj,35.62438,0.01000,2.567
|
323 |
+
45,mlp.down_proj,0.75896,0.01000,12.476
|
324 |
+
46,self_attn.k_proj,5.03439,0.01000,2.413
|
325 |
+
46,self_attn.v_proj,0.41520,0.01000,2.373
|
326 |
+
46,self_attn.q_proj,3.65707,0.01000,2.418
|
327 |
+
46,self_attn.o_proj,0.02733,0.01000,2.429
|
328 |
+
46,mlp.up_proj,30.43668,0.01000,2.596
|
329 |
+
46,mlp.gate_proj,36.21279,0.01000,2.555
|
330 |
+
46,mlp.down_proj,0.70465,0.01000,12.484
|
331 |
+
47,self_attn.k_proj,9.32724,0.01000,2.419
|
332 |
+
47,self_attn.v_proj,1.12588,0.01000,2.366
|
333 |
+
47,self_attn.q_proj,13.99360,0.01000,2.424
|
334 |
+
47,self_attn.o_proj,0.07536,0.01000,2.429
|
335 |
+
47,mlp.up_proj,30.93128,0.01000,2.606
|
336 |
+
47,mlp.gate_proj,36.81147,0.01000,2.562
|
337 |
+
47,mlp.down_proj,0.75357,0.01000,12.446
|
338 |
+
48,self_attn.k_proj,9.56606,0.01000,2.397
|
339 |
+
48,self_attn.v_proj,1.20021,0.01000,2.341
|
340 |
+
48,self_attn.q_proj,14.59574,0.01000,2.424
|
341 |
+
48,self_attn.o_proj,0.05555,0.01000,2.431
|
342 |
+
48,mlp.up_proj,31.49958,0.01000,2.590
|
343 |
+
48,mlp.gate_proj,37.59175,0.01000,2.550
|
344 |
+
48,mlp.down_proj,0.85475,0.01000,12.454
|
345 |
+
49,self_attn.k_proj,9.73940,0.01000,2.409
|
346 |
+
49,self_attn.v_proj,1.12793,0.01000,2.345
|
347 |
+
49,self_attn.q_proj,14.39461,0.01000,2.426
|
348 |
+
49,self_attn.o_proj,0.07215,0.01000,2.433
|
349 |
+
49,mlp.up_proj,32.26957,0.01000,2.601
|
350 |
+
49,mlp.gate_proj,38.52919,0.01000,2.558
|
351 |
+
49,mlp.down_proj,0.85321,0.01000,12.449
|
352 |
+
50,self_attn.k_proj,7.50268,0.01000,2.412
|
353 |
+
50,self_attn.v_proj,0.91148,0.01000,2.363
|
354 |
+
50,self_attn.q_proj,9.03854,0.01000,2.414
|
355 |
+
50,self_attn.o_proj,0.05698,0.01000,2.413
|
356 |
+
50,mlp.up_proj,32.78205,0.01000,2.599
|
357 |
+
50,mlp.gate_proj,39.19064,0.01000,2.560
|
358 |
+
50,mlp.down_proj,0.78843,0.01000,12.456
|
359 |
+
51,self_attn.k_proj,8.62929,0.01000,2.384
|
360 |
+
51,self_attn.v_proj,1.10167,0.01000,2.355
|
361 |
+
51,self_attn.q_proj,12.73033,0.01000,2.422
|
362 |
+
51,self_attn.o_proj,0.08332,0.01000,2.427
|
363 |
+
51,mlp.up_proj,33.36840,0.01000,2.602
|
364 |
+
51,mlp.gate_proj,39.81268,0.01000,2.552
|
365 |
+
51,mlp.down_proj,0.84592,0.01000,12.439
|
366 |
+
52,self_attn.k_proj,14.24103,0.01000,2.402
|
367 |
+
52,self_attn.v_proj,1.52739,0.01000,2.350
|
368 |
+
52,self_attn.q_proj,26.98552,0.01000,2.419
|
369 |
+
52,self_attn.o_proj,0.23821,0.01000,2.426
|
370 |
+
52,mlp.up_proj,34.04603,0.01000,2.598
|
371 |
+
52,mlp.gate_proj,40.77630,0.01000,2.553
|
372 |
+
52,mlp.down_proj,0.94730,0.01000,12.492
|
373 |
+
53,self_attn.k_proj,11.13863,0.01000,2.406
|
374 |
+
53,self_attn.v_proj,1.26610,0.01000,2.380
|
375 |
+
53,self_attn.q_proj,15.89432,0.01000,2.417
|
376 |
+
53,self_attn.o_proj,0.05793,0.01000,2.423
|
377 |
+
53,mlp.up_proj,34.83026,0.01000,2.582
|
378 |
+
53,mlp.gate_proj,41.77624,0.01000,2.552
|
379 |
+
53,mlp.down_proj,0.92240,0.01000,12.391
|
380 |
+
54,self_attn.k_proj,7.40175,0.01000,2.406
|
381 |
+
54,self_attn.v_proj,0.79817,0.01000,2.341
|
382 |
+
54,self_attn.q_proj,8.95007,0.01000,2.415
|
383 |
+
54,self_attn.o_proj,0.10005,0.01000,2.442
|
384 |
+
54,mlp.up_proj,35.37103,0.01000,2.599
|
385 |
+
54,mlp.gate_proj,41.93651,0.01000,2.536
|
386 |
+
54,mlp.down_proj,0.86324,0.01000,12.377
|
387 |
+
55,self_attn.k_proj,6.85297,0.01000,2.419
|
388 |
+
55,self_attn.v_proj,0.80341,0.01000,2.341
|
389 |
+
55,self_attn.q_proj,9.80242,0.01000,2.419
|
390 |
+
55,self_attn.o_proj,0.10725,0.01000,2.435
|
391 |
+
55,mlp.up_proj,35.42970,0.01000,2.590
|
392 |
+
55,mlp.gate_proj,42.14802,0.01000,2.560
|
393 |
+
55,mlp.down_proj,0.90768,0.01000,12.442
|
394 |
+
56,self_attn.k_proj,13.88305,0.01000,2.394
|
395 |
+
56,self_attn.v_proj,1.85680,0.01000,2.350
|
396 |
+
56,self_attn.q_proj,26.94255,0.01000,2.390
|
397 |
+
56,self_attn.o_proj,0.20183,0.01000,2.436
|
398 |
+
56,mlp.up_proj,36.07793,0.01000,2.592
|
399 |
+
56,mlp.gate_proj,43.35723,0.01000,2.545
|
400 |
+
56,mlp.down_proj,1.01939,0.01000,12.415
|
401 |
+
57,self_attn.k_proj,10.69875,0.01000,2.405
|
402 |
+
57,self_attn.v_proj,1.38184,0.01000,2.319
|
403 |
+
57,self_attn.q_proj,15.78839,0.01000,2.408
|
404 |
+
57,self_attn.o_proj,0.15118,0.01000,2.438
|
405 |
+
57,mlp.up_proj,36.95335,0.01000,2.595
|
406 |
+
57,mlp.gate_proj,44.50830,0.01000,2.544
|
407 |
+
57,mlp.down_proj,0.99837,0.01000,12.462
|
408 |
+
58,self_attn.k_proj,7.56804,0.01000,2.398
|
409 |
+
58,self_attn.v_proj,1.12267,0.01000,2.348
|
410 |
+
58,self_attn.q_proj,10.17075,0.01000,2.424
|
411 |
+
58,self_attn.o_proj,0.08434,0.01000,2.441
|
412 |
+
58,mlp.up_proj,37.68964,0.01000,2.599
|
413 |
+
58,mlp.gate_proj,44.71976,0.01000,2.543
|
414 |
+
58,mlp.down_proj,0.94810,0.01000,12.437
|
415 |
+
59,self_attn.k_proj,7.43233,0.01000,2.413
|
416 |
+
59,self_attn.v_proj,0.91834,0.01000,2.343
|
417 |
+
59,self_attn.q_proj,8.87059,0.01000,2.395
|
418 |
+
59,self_attn.o_proj,0.05050,0.01000,2.433
|
419 |
+
59,mlp.up_proj,38.86263,0.01000,2.591
|
420 |
+
59,mlp.gate_proj,46.91222,0.01000,2.557
|
421 |
+
59,mlp.down_proj,1.04556,0.01000,12.446
|
422 |
+
60,self_attn.k_proj,13.29610,0.01000,2.405
|
423 |
+
60,self_attn.v_proj,2.16565,0.01000,2.373
|
424 |
+
60,self_attn.q_proj,25.22976,0.01000,2.430
|
425 |
+
60,self_attn.o_proj,0.16070,0.01000,2.401
|
426 |
+
60,mlp.up_proj,39.92323,0.01000,2.594
|
427 |
+
60,mlp.gate_proj,48.80389,0.01000,2.562
|
428 |
+
60,mlp.down_proj,1.19647,0.01000,12.480
|
429 |
+
61,self_attn.k_proj,9.04602,0.01000,2.407
|
430 |
+
61,self_attn.v_proj,1.31423,0.01000,2.354
|
431 |
+
61,self_attn.q_proj,11.27571,0.01000,2.430
|
432 |
+
61,self_attn.o_proj,0.11997,0.01000,2.426
|
433 |
+
61,mlp.up_proj,40.52758,0.01000,2.601
|
434 |
+
61,mlp.gate_proj,49.42426,0.01000,2.551
|
435 |
+
61,mlp.down_proj,1.14733,0.01000,12.427
|
436 |
+
62,self_attn.k_proj,6.08225,0.01000,2.400
|
437 |
+
62,self_attn.v_proj,0.54749,0.01000,2.341
|
438 |
+
62,self_attn.q_proj,3.91657,0.01000,2.427
|
439 |
+
62,self_attn.o_proj,0.03115,0.01000,2.430
|
440 |
+
62,mlp.up_proj,40.40889,0.01000,2.569
|
441 |
+
62,mlp.gate_proj,48.50503,0.01000,2.558
|
442 |
+
62,mlp.down_proj,1.03680,0.01000,12.433
|
443 |
+
63,self_attn.k_proj,7.13903,0.01000,2.395
|
444 |
+
63,self_attn.v_proj,0.90019,0.01000,2.339
|
445 |
+
63,self_attn.q_proj,8.04566,0.01000,2.423
|
446 |
+
63,self_attn.o_proj,0.06037,0.01000,2.428
|
447 |
+
63,mlp.up_proj,42.07748,0.01000,2.598
|
448 |
+
63,mlp.gate_proj,51.37971,0.01000,2.556
|
449 |
+
63,mlp.down_proj,1.16115,0.01000,12.440
|
450 |
+
64,self_attn.k_proj,12.30144,0.01000,2.389
|
451 |
+
64,self_attn.v_proj,1.94175,0.01000,2.347
|
452 |
+
64,self_attn.q_proj,20.16385,0.01000,2.420
|
453 |
+
64,self_attn.o_proj,0.24632,0.01000,2.439
|
454 |
+
64,mlp.up_proj,44.01347,0.01000,2.588
|
455 |
+
64,mlp.gate_proj,55.13173,0.01000,2.553
|
456 |
+
64,mlp.down_proj,1.38282,0.01000,12.488
|
457 |
+
65,self_attn.k_proj,6.82733,0.01000,2.398
|
458 |
+
65,self_attn.v_proj,0.78277,0.01000,2.352
|
459 |
+
65,self_attn.q_proj,6.81213,0.01000,2.420
|
460 |
+
65,self_attn.o_proj,0.07622,0.01000,2.441
|
461 |
+
65,mlp.up_proj,44.64717,0.01000,2.598
|
462 |
+
65,mlp.gate_proj,55.94937,0.01000,2.550
|
463 |
+
65,mlp.down_proj,1.31563,0.01000,12.353
|
464 |
+
66,self_attn.k_proj,7.05296,0.01000,2.387
|
465 |
+
66,self_attn.v_proj,1.03377,0.01000,2.330
|
466 |
+
66,self_attn.q_proj,8.85096,0.01000,2.411
|
467 |
+
66,self_attn.o_proj,0.13433,0.01000,2.434
|
468 |
+
66,mlp.up_proj,44.82061,0.01000,2.602
|
469 |
+
66,mlp.gate_proj,54.01328,0.01000,2.544
|
470 |
+
66,mlp.down_proj,1.22117,0.01000,12.403
|
471 |
+
67,self_attn.k_proj,12.34406,0.01000,2.394
|
472 |
+
67,self_attn.v_proj,2.19811,0.01000,2.371
|
473 |
+
67,self_attn.q_proj,20.21918,0.01000,2.421
|
474 |
+
67,self_attn.o_proj,0.23947,0.01000,2.428
|
475 |
+
67,mlp.up_proj,46.74456,0.01000,2.591
|
476 |
+
67,mlp.gate_proj,56.45784,0.01000,2.545
|
477 |
+
67,mlp.down_proj,1.34151,0.01000,12.484
|
478 |
+
68,self_attn.k_proj,13.16044,0.01000,2.423
|
479 |
+
68,self_attn.v_proj,2.73707,0.01000,2.354
|
480 |
+
68,self_attn.q_proj,24.21140,0.01000,2.414
|
481 |
+
68,self_attn.o_proj,0.30300,0.01000,2.456
|
482 |
+
68,mlp.up_proj,49.65003,0.01000,2.607
|
483 |
+
68,mlp.gate_proj,61.89810,0.01000,2.551
|
484 |
+
68,mlp.down_proj,1.64361,0.01000,12.423
|
485 |
+
69,self_attn.k_proj,10.67953,0.01000,2.396
|
486 |
+
69,self_attn.v_proj,2.16242,0.01000,2.341
|
487 |
+
69,self_attn.q_proj,18.11952,0.01000,2.400
|
488 |
+
69,self_attn.o_proj,0.20832,0.01000,2.421
|
489 |
+
69,mlp.up_proj,50.93095,0.01000,2.596
|
490 |
+
69,mlp.gate_proj,62.72586,0.01000,2.549
|
491 |
+
69,mlp.down_proj,1.61045,0.01000,12.533
|
492 |
+
70,self_attn.k_proj,10.28304,0.01000,2.399
|
493 |
+
70,self_attn.v_proj,1.98366,0.01000,2.359
|
494 |
+
70,self_attn.q_proj,19.90069,0.01000,2.390
|
495 |
+
70,self_attn.o_proj,0.35756,0.01000,2.436
|
496 |
+
70,mlp.up_proj,51.26246,0.01000,2.604
|
497 |
+
70,mlp.gate_proj,60.92408,0.01000,2.563
|
498 |
+
70,mlp.down_proj,1.57580,0.01000,12.480
|
499 |
+
71,self_attn.k_proj,12.47268,0.01000,2.396
|
500 |
+
71,self_attn.v_proj,2.70028,0.01000,2.355
|
501 |
+
71,self_attn.q_proj,27.55191,0.01000,2.385
|
502 |
+
71,self_attn.o_proj,0.93984,0.01000,2.428
|
503 |
+
71,mlp.up_proj,55.26141,0.01000,2.595
|
504 |
+
71,mlp.gate_proj,65.54773,0.01000,2.549
|
505 |
+
71,mlp.down_proj,1.90825,0.01000,12.460
|
506 |
+
72,self_attn.k_proj,13.01985,0.01000,2.408
|
507 |
+
72,self_attn.v_proj,3.01720,0.01000,2.357
|
508 |
+
72,self_attn.q_proj,30.32354,0.01000,2.437
|
509 |
+
72,self_attn.o_proj,0.44778,0.01000,2.445
|
510 |
+
72,mlp.up_proj,58.38693,0.01000,2.610
|
511 |
+
72,mlp.gate_proj,71.82819,0.01000,2.559
|
512 |
+
72,mlp.down_proj,2.24979,0.01000,12.446
|
513 |
+
73,self_attn.k_proj,12.93038,0.01000,2.406
|
514 |
+
73,self_attn.v_proj,3.20805,0.01000,2.342
|
515 |
+
73,self_attn.q_proj,29.55270,0.01000,2.424
|
516 |
+
73,self_attn.o_proj,1.00655,0.01000,2.436
|
517 |
+
73,mlp.up_proj,58.70067,0.01000,2.594
|
518 |
+
73,mlp.gate_proj,71.63084,0.01000,2.556
|
519 |
+
73,mlp.down_proj,2.31351,0.01000,12.468
|
520 |
+
74,self_attn.k_proj,12.20197,0.01000,2.403
|
521 |
+
74,self_attn.v_proj,3.11274,0.01000,2.358
|
522 |
+
74,self_attn.q_proj,28.71220,0.01000,2.423
|
523 |
+
74,self_attn.o_proj,1.16861,0.01000,2.403
|
524 |
+
74,mlp.up_proj,61.27262,0.01000,2.587
|
525 |
+
74,mlp.gate_proj,74.21090,0.01000,2.548
|
526 |
+
74,mlp.down_proj,2.48106,0.01000,12.486
|
527 |
+
75,self_attn.k_proj,11.45592,0.01000,2.423
|
528 |
+
75,self_attn.v_proj,3.51124,0.01000,2.359
|
529 |
+
75,self_attn.q_proj,30.38795,0.01000,2.413
|
530 |
+
75,self_attn.o_proj,2.18176,0.01000,2.446
|
531 |
+
75,mlp.up_proj,66.98369,0.01000,2.612
|
532 |
+
75,mlp.gate_proj,83.39505,0.01000,2.540
|
533 |
+
75,mlp.down_proj,3.69956,0.01000,12.424
|
534 |
+
76,self_attn.k_proj,10.18937,0.01000,2.412
|
535 |
+
76,self_attn.v_proj,3.41040,0.01000,2.366
|
536 |
+
76,self_attn.q_proj,27.26140,0.01000,2.445
|
537 |
+
76,self_attn.o_proj,1.05649,0.01000,2.450
|
538 |
+
76,mlp.up_proj,78.13490,0.01000,2.615
|
539 |
+
76,mlp.gate_proj,118.95868,0.01000,2.555
|
540 |
+
76,mlp.down_proj,5.51300,0.01000,12.506
|
541 |
+
77,self_attn.k_proj,11.54971,0.01000,2.413
|
542 |
+
77,self_attn.v_proj,4.01822,0.01000,2.364
|
543 |
+
77,self_attn.q_proj,29.42512,0.01000,2.424
|
544 |
+
77,self_attn.o_proj,1.65369,0.01000,2.446
|
545 |
+
77,mlp.up_proj,74.31666,0.01000,2.601
|
546 |
+
77,mlp.gate_proj,93.92165,0.01000,2.547
|
547 |
+
77,mlp.down_proj,6.31596,0.01000,12.536
|
548 |
+
78,self_attn.k_proj,10.21922,0.01000,2.425
|
549 |
+
78,self_attn.v_proj,2.88337,0.01000,2.382
|
550 |
+
78,self_attn.q_proj,24.15326,0.01000,2.417
|
551 |
+
78,self_attn.o_proj,1.91129,0.01000,2.453
|
552 |
+
78,mlp.up_proj,71.57212,0.01000,2.619
|
553 |
+
78,mlp.gate_proj,88.37552,0.01000,2.566
|
554 |
+
78,mlp.down_proj,13.54613,0.01000,12.559
|
555 |
+
79,self_attn.k_proj,4.50027,0.01000,2.416
|
556 |
+
79,self_attn.v_proj,1.45889,0.01000,2.372
|
557 |
+
79,self_attn.q_proj,8.78865,0.01000,2.427
|
558 |
+
79,self_attn.o_proj,1.06731,0.01000,2.438
|
559 |
+
79,mlp.up_proj,44.81396,0.01000,2.621
|
560 |
+
79,mlp.gate_proj,52.70864,0.01000,2.574
|
561 |
+
79,mlp.down_proj,18.51311,0.01000,12.513
|
quantize_config.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bits": 4,
|
3 |
+
"dynamic": null,
|
4 |
+
"group_size": 128,
|
5 |
+
"desc_act": true,
|
6 |
+
"sym": true,
|
7 |
+
"lm_head": false,
|
8 |
+
"quant_method": "gptq",
|
9 |
+
"checkpoint_format": "gptq",
|
10 |
+
"meta": {
|
11 |
+
"quantizer": [
|
12 |
+
"gptqmodel:1.4.0-dev"
|
13 |
+
],
|
14 |
+
"uri": "https://github.com/modelcloud/gptqmodel",
|
15 |
+
"damp_percent": 0.01,
|
16 |
+
"damp_auto_increment": 0.0015,
|
17 |
+
"static_groups": false,
|
18 |
+
"true_sequential": true
|
19 |
+
}
|
20 |
+
}
|