shuyuej committed on
Commit
f9adbd7
1 Parent(s): 49f84ae

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. config.json +61 -0
  2. model.safetensors +3 -0
  3. quant_log.csv +561 -0
  4. quantize_config.json +20 -0
config.json ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "_name_or_path": "meta-llama/Llama-3.3-70B-Instruct",
4
+ "architectures": [
5
+ "LlamaForCausalLM"
6
+ ],
7
+ "attention_bias": false,
8
+ "attention_dropout": 0.0,
9
+ "bos_token_id": 128000,
10
+ "eos_token_id": [
11
+ 128001,
12
+ 128008,
13
+ 128009
14
+ ],
15
+ "head_dim": 128,
16
+ "hidden_act": "silu",
17
+ "hidden_size": 8192,
18
+ "initializer_range": 0.02,
19
+ "intermediate_size": 28672,
20
+ "max_position_embeddings": 131072,
21
+ "mlp_bias": false,
22
+ "model_type": "llama",
23
+ "num_attention_heads": 64,
24
+ "num_hidden_layers": 80,
25
+ "num_key_value_heads": 8,
26
+ "pretraining_tp": 1,
27
+ "quantization_config": {
28
+ "bits": 4,
29
+ "checkpoint_format": "gptq",
30
+ "desc_act": true,
31
+ "dynamic": null,
32
+ "group_size": 128,
33
+ "lm_head": false,
34
+ "meta": {
35
+ "damp_auto_increment": 0.0015,
36
+ "damp_percent": 0.01,
37
+ "quantizer": [
38
+ "gptqmodel:1.4.0-dev"
39
+ ],
40
+ "static_groups": false,
41
+ "true_sequential": true,
42
+ "uri": "https://github.com/modelcloud/gptqmodel"
43
+ },
44
+ "quant_method": "gptq",
45
+ "sym": true
46
+ },
47
+ "rms_norm_eps": 1e-05,
48
+ "rope_scaling": {
49
+ "factor": 8.0,
50
+ "high_freq_factor": 4.0,
51
+ "low_freq_factor": 1.0,
52
+ "original_max_position_embeddings": 8192,
53
+ "rope_type": "llama3"
54
+ },
55
+ "rope_theta": 500000.0,
56
+ "tie_word_embeddings": false,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.47.0",
59
+ "use_cache": true,
60
+ "vocab_size": 128256
61
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7922de01bdca5ad0d97084163f53b2954a48b179a006c25e838d45432046f587
3
+ size 39792965480
quant_log.csv ADDED
@@ -0,0 +1,561 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ layer,module,loss,damp,time
2
+ 0,self_attn.k_proj,0.57035,0.01000,2.657
3
+ 0,self_attn.v_proj,1.47052,0.01000,2.351
4
+ 0,self_attn.q_proj,1.32896,0.01000,2.406
5
+ 0,self_attn.o_proj,0.00012,0.01000,2.410
6
+ 0,mlp.up_proj,0.42204,0.01000,2.590
7
+ 0,mlp.gate_proj,0.43135,0.01000,2.543
8
+ 0,mlp.down_proj,0.00059,0.01000,12.464
9
+ 1,self_attn.k_proj,0.42801,0.01000,2.404
10
+ 1,self_attn.v_proj,0.40142,0.01000,2.362
11
+ 1,self_attn.q_proj,1.63970,0.01000,2.426
12
+ 1,self_attn.o_proj,0.00060,0.01000,2.436
13
+ 1,mlp.up_proj,0.42048,0.01000,2.597
14
+ 1,mlp.gate_proj,0.43219,0.01000,2.544
15
+ 1,mlp.down_proj,0.00066,0.01000,12.450
16
+ 2,self_attn.k_proj,0.13810,0.01000,2.390
17
+ 2,self_attn.v_proj,0.02891,0.01000,2.347
18
+ 2,self_attn.q_proj,0.63511,0.01000,2.417
19
+ 2,self_attn.o_proj,0.00098,0.01000,2.426
20
+ 2,mlp.up_proj,0.94861,0.01000,2.574
21
+ 2,mlp.gate_proj,0.97155,0.01000,2.534
22
+ 2,mlp.down_proj,0.00155,0.01000,12.369
23
+ 3,self_attn.k_proj,0.37560,0.01000,2.370
24
+ 3,self_attn.v_proj,0.05439,0.01000,2.339
25
+ 3,self_attn.q_proj,1.19933,0.01000,2.401
26
+ 3,self_attn.o_proj,0.00116,0.01000,2.424
27
+ 3,mlp.up_proj,1.59134,0.01000,2.584
28
+ 3,mlp.gate_proj,1.77250,0.01000,2.544
29
+ 3,mlp.down_proj,0.02647,0.01000,12.401
30
+ 4,self_attn.k_proj,0.41622,0.01000,2.398
31
+ 4,self_attn.v_proj,0.06400,0.01000,2.358
32
+ 4,self_attn.q_proj,1.26602,0.01000,2.411
33
+ 4,self_attn.o_proj,0.00084,0.01000,2.422
34
+ 4,mlp.up_proj,1.74960,0.01000,2.584
35
+ 4,mlp.gate_proj,1.80884,0.01000,2.540
36
+ 4,mlp.down_proj,0.00400,0.01000,12.399
37
+ 5,self_attn.k_proj,0.60114,0.01000,2.393
38
+ 5,self_attn.v_proj,0.13286,0.01000,2.344
39
+ 5,self_attn.q_proj,1.89099,0.01000,2.419
40
+ 5,self_attn.o_proj,0.00190,0.01000,2.437
41
+ 5,mlp.up_proj,2.20372,0.01000,2.589
42
+ 5,mlp.gate_proj,2.37831,0.01000,2.540
43
+ 5,mlp.down_proj,0.00660,0.01000,12.367
44
+ 6,self_attn.k_proj,1.00460,0.01000,2.371
45
+ 6,self_attn.v_proj,0.15128,0.01000,2.326
46
+ 6,self_attn.q_proj,2.92848,0.01000,2.386
47
+ 6,self_attn.o_proj,0.00212,0.01000,2.409
48
+ 6,mlp.up_proj,2.19970,0.01000,2.576
49
+ 6,mlp.gate_proj,2.31402,0.01000,2.532
50
+ 6,mlp.down_proj,0.00919,0.01000,12.448
51
+ 7,self_attn.k_proj,1.19295,0.01000,2.380
52
+ 7,self_attn.v_proj,0.17405,0.01000,2.322
53
+ 7,self_attn.q_proj,3.59537,0.01000,2.403
54
+ 7,self_attn.o_proj,0.00162,0.01000,2.428
55
+ 7,mlp.up_proj,2.58627,0.01000,2.576
56
+ 7,mlp.gate_proj,2.73543,0.01000,2.530
57
+ 7,mlp.down_proj,0.01228,0.01000,12.390
58
+ 8,self_attn.k_proj,0.88642,0.01000,2.384
59
+ 8,self_attn.v_proj,0.16166,0.01000,2.319
60
+ 8,self_attn.q_proj,2.53692,0.01000,2.407
61
+ 8,self_attn.o_proj,0.00341,0.01000,2.410
62
+ 8,mlp.up_proj,3.88630,0.01000,2.579
63
+ 8,mlp.gate_proj,4.10945,0.01000,2.534
64
+ 8,mlp.down_proj,0.01468,0.01000,12.399
65
+ 9,self_attn.k_proj,0.75486,0.01000,2.376
66
+ 9,self_attn.v_proj,0.12879,0.01000,2.322
67
+ 9,self_attn.q_proj,2.22640,0.01000,2.396
68
+ 9,self_attn.o_proj,0.00491,0.01000,2.402
69
+ 9,mlp.up_proj,6.16445,0.01000,2.583
70
+ 9,mlp.gate_proj,6.62525,0.01000,2.535
71
+ 9,mlp.down_proj,0.01891,0.01000,12.377
72
+ 10,self_attn.k_proj,2.21197,0.01000,2.372
73
+ 10,self_attn.v_proj,0.29660,0.01000,2.325
74
+ 10,self_attn.q_proj,6.23046,0.01000,2.413
75
+ 10,self_attn.o_proj,0.00592,0.01000,2.384
76
+ 10,mlp.up_proj,4.15596,0.01000,2.571
77
+ 10,mlp.gate_proj,4.44713,0.01000,2.536
78
+ 10,mlp.down_proj,0.02901,0.01000,12.351
79
+ 11,self_attn.k_proj,2.23967,0.01000,2.400
80
+ 11,self_attn.v_proj,0.31593,0.01000,2.351
81
+ 11,self_attn.q_proj,5.37146,0.01000,2.396
82
+ 11,self_attn.o_proj,0.00716,0.01000,2.390
83
+ 11,mlp.up_proj,6.03220,0.01000,2.578
84
+ 11,mlp.gate_proj,6.44322,0.01000,2.534
85
+ 11,mlp.down_proj,0.03901,0.01000,12.379
86
+ 12,self_attn.k_proj,1.53060,0.01000,2.379
87
+ 12,self_attn.v_proj,0.26643,0.01000,2.330
88
+ 12,self_attn.q_proj,4.37793,0.01000,2.396
89
+ 12,self_attn.o_proj,0.00726,0.01000,2.401
90
+ 12,mlp.up_proj,5.41540,0.01000,2.584
91
+ 12,mlp.gate_proj,5.80091,0.01000,2.539
92
+ 12,mlp.down_proj,0.04740,0.01000,12.316
93
+ 13,self_attn.k_proj,2.27633,0.01000,2.376
94
+ 13,self_attn.v_proj,0.30485,0.01000,2.320
95
+ 13,self_attn.q_proj,6.06090,0.01000,2.388
96
+ 13,self_attn.o_proj,0.02961,0.01000,2.405
97
+ 13,mlp.up_proj,5.01690,0.01000,2.576
98
+ 13,mlp.gate_proj,5.32263,0.01000,2.531
99
+ 13,mlp.down_proj,0.06650,0.01000,12.387
100
+ 14,self_attn.k_proj,2.83633,0.01000,2.373
101
+ 14,self_attn.v_proj,0.37186,0.01000,2.312
102
+ 14,self_attn.q_proj,8.34845,0.01000,2.401
103
+ 14,self_attn.o_proj,0.04001,0.01000,2.407
104
+ 14,mlp.up_proj,6.58338,0.01000,2.553
105
+ 14,mlp.gate_proj,7.04548,0.01000,2.526
106
+ 14,mlp.down_proj,0.09719,0.01000,12.348
107
+ 15,self_attn.k_proj,2.48118,0.01000,2.397
108
+ 15,self_attn.v_proj,0.35579,0.01000,2.340
109
+ 15,self_attn.q_proj,7.05407,0.01000,2.412
110
+ 15,self_attn.o_proj,0.04138,0.01000,2.441
111
+ 15,mlp.up_proj,7.82927,0.01000,2.577
112
+ 15,mlp.gate_proj,8.54841,0.01000,2.537
113
+ 15,mlp.down_proj,0.12537,0.01000,12.442
114
+ 16,self_attn.k_proj,2.62704,0.01000,2.372
115
+ 16,self_attn.v_proj,0.39784,0.01000,2.336
116
+ 16,self_attn.q_proj,8.07435,0.01000,2.379
117
+ 16,self_attn.o_proj,0.05020,0.01000,2.401
118
+ 16,mlp.up_proj,10.08904,0.01000,2.570
119
+ 16,mlp.gate_proj,11.10111,0.01000,2.528
120
+ 16,mlp.down_proj,0.16947,0.01000,12.337
121
+ 17,self_attn.k_proj,4.36580,0.01000,2.385
122
+ 17,self_attn.v_proj,0.46434,0.01000,2.309
123
+ 17,self_attn.q_proj,12.00885,0.01000,2.414
124
+ 17,self_attn.o_proj,0.12850,0.01000,2.425
125
+ 17,mlp.up_proj,12.33495,0.01000,2.574
126
+ 17,mlp.gate_proj,13.55825,0.01000,2.529
127
+ 17,mlp.down_proj,0.24378,0.01000,12.424
128
+ 18,self_attn.k_proj,5.60858,0.01000,2.380
129
+ 18,self_attn.v_proj,0.63289,0.01000,2.354
130
+ 18,self_attn.q_proj,16.55243,0.01000,2.401
131
+ 18,self_attn.o_proj,0.14321,0.01000,2.402
132
+ 18,mlp.up_proj,15.96843,0.01000,2.550
133
+ 18,mlp.gate_proj,17.98333,0.01000,2.500
134
+ 18,mlp.down_proj,0.32340,0.01000,12.371
135
+ 19,self_attn.k_proj,5.16959,0.01000,2.400
136
+ 19,self_attn.v_proj,0.74440,0.01000,2.347
137
+ 19,self_attn.q_proj,14.47852,0.01000,2.394
138
+ 19,self_attn.o_proj,0.14691,0.01000,2.430
139
+ 19,mlp.up_proj,16.84079,0.01000,2.590
140
+ 19,mlp.gate_proj,19.60419,0.01000,2.546
141
+ 19,mlp.down_proj,0.36414,0.01000,12.410
142
+ 20,self_attn.k_proj,6.47528,0.01000,2.380
143
+ 20,self_attn.v_proj,0.74963,0.01000,2.327
144
+ 20,self_attn.q_proj,14.17394,0.01000,2.408
145
+ 20,self_attn.o_proj,0.11211,0.01000,2.410
146
+ 20,mlp.up_proj,18.55169,0.01000,2.570
147
+ 20,mlp.gate_proj,21.14960,0.01000,2.524
148
+ 20,mlp.down_proj,0.37619,0.01000,12.351
149
+ 21,self_attn.k_proj,9.81788,0.01000,2.356
150
+ 21,self_attn.v_proj,0.89676,0.01000,2.299
151
+ 21,self_attn.q_proj,22.92135,0.01000,2.392
152
+ 21,self_attn.o_proj,0.16588,0.01000,2.393
153
+ 21,mlp.up_proj,21.32033,0.01000,2.581
154
+ 21,mlp.gate_proj,24.48094,0.01000,2.538
155
+ 21,mlp.down_proj,0.42420,0.01000,12.352
156
+ 22,self_attn.k_proj,10.66650,0.01000,2.377
157
+ 22,self_attn.v_proj,1.39040,0.01000,2.323
158
+ 22,self_attn.q_proj,23.65294,0.01000,2.398
159
+ 22,self_attn.o_proj,0.09598,0.01000,2.427
160
+ 22,mlp.up_proj,23.02085,0.01000,2.577
161
+ 22,mlp.gate_proj,27.06548,0.01000,2.531
162
+ 22,mlp.down_proj,0.42023,0.01000,12.385
163
+ 23,self_attn.k_proj,11.88396,0.01000,2.400
164
+ 23,self_attn.v_proj,1.27841,0.01000,2.370
165
+ 23,self_attn.q_proj,25.22909,0.01000,2.417
166
+ 23,self_attn.o_proj,0.12637,0.01000,2.437
167
+ 23,mlp.up_proj,24.15950,0.01000,2.603
168
+ 23,mlp.gate_proj,28.57765,0.01000,2.561
169
+ 23,mlp.down_proj,0.42992,0.01000,12.479
170
+ 24,self_attn.k_proj,6.27533,0.01000,2.372
171
+ 24,self_attn.v_proj,0.67591,0.01000,2.308
172
+ 24,self_attn.q_proj,11.09771,0.01000,2.394
173
+ 24,self_attn.o_proj,0.10294,0.01000,2.407
174
+ 24,mlp.up_proj,25.17421,0.01000,2.575
175
+ 24,mlp.gate_proj,29.08055,0.01000,2.531
176
+ 24,mlp.down_proj,0.45674,0.01000,12.389
177
+ 25,self_attn.k_proj,12.02082,0.01000,2.411
178
+ 25,self_attn.v_proj,1.35643,0.01000,2.373
179
+ 25,self_attn.q_proj,23.12022,0.01000,2.414
180
+ 25,self_attn.o_proj,0.11384,0.01000,2.408
181
+ 25,mlp.up_proj,27.31142,0.01000,2.594
182
+ 25,mlp.gate_proj,31.58317,0.01000,2.558
183
+ 25,mlp.down_proj,0.49229,0.01000,12.438
184
+ 26,self_attn.k_proj,11.96870,0.01000,2.423
185
+ 26,self_attn.v_proj,1.38614,0.01000,2.350
186
+ 26,self_attn.q_proj,23.65503,0.01000,2.426
187
+ 26,self_attn.o_proj,0.12416,0.01000,2.423
188
+ 26,mlp.up_proj,28.19983,0.01000,2.614
189
+ 26,mlp.gate_proj,32.36074,0.01000,2.552
190
+ 26,mlp.down_proj,0.52981,0.01000,12.445
191
+ 27,self_attn.k_proj,12.18930,0.01000,2.377
192
+ 27,self_attn.v_proj,0.86143,0.01000,2.337
193
+ 27,self_attn.q_proj,23.78441,0.01000,2.410
194
+ 27,self_attn.o_proj,0.25728,0.01000,2.420
195
+ 27,mlp.up_proj,26.60479,0.01000,2.577
196
+ 27,mlp.gate_proj,29.91342,0.01000,2.543
197
+ 27,mlp.down_proj,0.57599,0.01000,12.401
198
+ 28,self_attn.k_proj,14.01640,0.01000,2.407
199
+ 28,self_attn.v_proj,1.19739,0.01000,2.365
200
+ 28,self_attn.q_proj,28.35421,0.01000,2.401
201
+ 28,self_attn.o_proj,0.21742,0.01000,2.434
202
+ 28,mlp.up_proj,27.32375,0.01000,2.588
203
+ 28,mlp.gate_proj,30.71216,0.01000,2.542
204
+ 28,mlp.down_proj,0.64283,0.01000,12.378
205
+ 29,self_attn.k_proj,14.76551,0.01000,2.398
206
+ 29,self_attn.v_proj,1.14310,0.01000,2.362
207
+ 29,self_attn.q_proj,28.58216,0.01000,2.409
208
+ 29,self_attn.o_proj,0.24004,0.01000,2.427
209
+ 29,mlp.up_proj,28.34542,0.01000,2.598
210
+ 29,mlp.gate_proj,31.86575,0.01000,2.552
211
+ 29,mlp.down_proj,0.68480,0.01000,12.450
212
+ 30,self_attn.k_proj,11.88239,0.01000,2.395
213
+ 30,self_attn.v_proj,0.98647,0.01000,2.343
214
+ 30,self_attn.q_proj,23.09733,0.01000,2.407
215
+ 30,self_attn.o_proj,0.25479,0.01000,2.423
216
+ 30,mlp.up_proj,27.81762,0.01000,2.594
217
+ 30,mlp.gate_proj,30.93171,0.01000,2.547
218
+ 30,mlp.down_proj,0.67414,0.01000,12.351
219
+ 31,self_attn.k_proj,15.44827,0.01000,2.383
220
+ 31,self_attn.v_proj,1.00508,0.01000,2.325
221
+ 31,self_attn.q_proj,33.67770,0.01000,2.384
222
+ 31,self_attn.o_proj,0.44765,0.01000,2.412
223
+ 31,mlp.up_proj,28.46461,0.01000,2.577
224
+ 31,mlp.gate_proj,30.97182,0.01000,2.531
225
+ 31,mlp.down_proj,0.70130,0.01000,12.405
226
+ 32,self_attn.k_proj,10.04720,0.01000,2.386
227
+ 32,self_attn.v_proj,1.12798,0.01000,2.354
228
+ 32,self_attn.q_proj,20.07824,0.01000,2.389
229
+ 32,self_attn.o_proj,0.18536,0.01000,2.413
230
+ 32,mlp.up_proj,28.29184,0.01000,2.573
231
+ 32,mlp.gate_proj,31.21350,0.01000,2.531
232
+ 32,mlp.down_proj,0.73541,0.01000,12.368
233
+ 33,self_attn.k_proj,15.88254,0.01000,2.391
234
+ 33,self_attn.v_proj,1.10900,0.01000,2.339
235
+ 33,self_attn.q_proj,34.42078,0.01000,2.400
236
+ 33,self_attn.o_proj,0.41791,0.01000,2.406
237
+ 33,mlp.up_proj,70.70566,0.01000,2.585
238
+ 33,mlp.gate_proj,75.96263,0.01000,2.542
239
+ 33,mlp.down_proj,0.75321,0.01000,12.361
240
+ 34,self_attn.k_proj,13.84434,0.01000,2.406
241
+ 34,self_attn.v_proj,1.10936,0.01000,2.333
242
+ 34,self_attn.q_proj,29.83056,0.01000,2.424
243
+ 34,self_attn.o_proj,0.38872,0.01000,2.434
244
+ 34,mlp.up_proj,28.14292,0.01000,2.600
245
+ 34,mlp.gate_proj,30.72616,0.01000,2.556
246
+ 34,mlp.down_proj,0.77032,0.01000,12.496
247
+ 35,self_attn.k_proj,15.87492,0.01000,2.381
248
+ 35,self_attn.v_proj,1.14817,0.01000,2.320
249
+ 35,self_attn.q_proj,32.89777,0.01000,2.401
250
+ 35,self_attn.o_proj,0.42289,0.01000,2.409
251
+ 35,mlp.up_proj,28.14214,0.01000,2.578
252
+ 35,mlp.gate_proj,30.94142,0.01000,2.535
253
+ 35,mlp.down_proj,0.71352,0.01000,12.380
254
+ 36,self_attn.k_proj,11.59319,0.01000,2.377
255
+ 36,self_attn.v_proj,0.98563,0.01000,2.318
256
+ 36,self_attn.q_proj,21.57438,0.01000,2.384
257
+ 36,self_attn.o_proj,0.17942,0.01000,2.410
258
+ 36,mlp.up_proj,27.42457,0.01000,2.569
259
+ 36,mlp.gate_proj,30.79939,0.01000,2.525
260
+ 36,mlp.down_proj,0.72106,0.01000,12.391
261
+ 37,self_attn.k_proj,14.81283,0.01000,2.376
262
+ 37,self_attn.v_proj,1.04597,0.01000,2.331
263
+ 37,self_attn.q_proj,28.01339,0.01000,2.409
264
+ 37,self_attn.o_proj,0.22077,0.01000,2.419
265
+ 37,mlp.up_proj,27.39221,0.01000,2.575
266
+ 37,mlp.gate_proj,30.75794,0.01000,2.540
267
+ 37,mlp.down_proj,0.69618,0.01000,12.390
268
+ 38,self_attn.k_proj,13.16148,0.01000,2.380
269
+ 38,self_attn.v_proj,1.12986,0.01000,2.324
270
+ 38,self_attn.q_proj,24.62405,0.01000,2.385
271
+ 38,self_attn.o_proj,0.22751,0.01000,2.415
272
+ 38,mlp.up_proj,27.54411,0.01000,2.548
273
+ 38,mlp.gate_proj,31.43366,0.01000,2.528
274
+ 38,mlp.down_proj,0.67293,0.01000,12.317
275
+ 39,self_attn.k_proj,13.35156,0.01000,2.397
276
+ 39,self_attn.v_proj,1.18738,0.01000,2.355
277
+ 39,self_attn.q_proj,23.59219,0.01000,2.401
278
+ 39,self_attn.o_proj,0.16937,0.01000,2.409
279
+ 39,mlp.up_proj,27.48190,0.01000,2.570
280
+ 39,mlp.gate_proj,31.72308,0.01000,2.532
281
+ 39,mlp.down_proj,0.66521,0.01000,12.420
282
+ 40,self_attn.k_proj,10.13054,0.01000,2.424
283
+ 40,self_attn.v_proj,1.36028,0.01000,2.365
284
+ 40,self_attn.q_proj,20.56631,0.01000,2.418
285
+ 40,self_attn.o_proj,0.12621,0.01000,2.438
286
+ 40,mlp.up_proj,27.66399,0.01000,2.608
287
+ 40,mlp.gate_proj,32.16180,0.01000,2.564
288
+ 40,mlp.down_proj,0.72769,0.01000,12.428
289
+ 41,self_attn.k_proj,12.69510,0.01000,2.375
290
+ 41,self_attn.v_proj,1.12165,0.01000,2.328
291
+ 41,self_attn.q_proj,21.96209,0.01000,2.390
292
+ 41,self_attn.o_proj,0.13793,0.01000,2.423
293
+ 41,mlp.up_proj,28.21097,0.01000,2.587
294
+ 41,mlp.gate_proj,32.82212,0.01000,2.546
295
+ 41,mlp.down_proj,0.69244,0.01000,12.410
296
+ 42,self_attn.k_proj,8.44118,0.01000,2.378
297
+ 42,self_attn.v_proj,0.90866,0.01000,2.322
298
+ 42,self_attn.q_proj,13.04269,0.01000,2.396
299
+ 42,self_attn.o_proj,0.08163,0.01000,2.397
300
+ 42,mlp.up_proj,28.56101,0.01000,2.581
301
+ 42,mlp.gate_proj,33.50828,0.01000,2.542
302
+ 42,mlp.down_proj,0.64698,0.01000,12.371
303
+ 43,self_attn.k_proj,8.92527,0.01000,2.391
304
+ 43,self_attn.v_proj,0.98848,0.01000,2.324
305
+ 43,self_attn.q_proj,14.44163,0.01000,2.393
306
+ 43,self_attn.o_proj,0.09209,0.01000,2.430
307
+ 43,mlp.up_proj,29.11296,0.01000,2.580
308
+ 43,mlp.gate_proj,34.40512,0.01000,2.531
309
+ 43,mlp.down_proj,0.68803,0.01000,12.424
310
+ 44,self_attn.k_proj,13.99534,0.01000,2.388
311
+ 44,self_attn.v_proj,1.57364,0.01000,2.340
312
+ 44,self_attn.q_proj,28.14628,0.01000,2.410
313
+ 44,self_attn.o_proj,0.14434,0.01000,2.418
314
+ 44,mlp.up_proj,29.51572,0.01000,2.598
315
+ 44,mlp.gate_proj,35.05244,0.01000,2.552
316
+ 44,mlp.down_proj,0.76233,0.01000,12.385
317
+ 45,self_attn.k_proj,8.35592,0.01000,2.405
318
+ 45,self_attn.v_proj,0.92035,0.01000,2.346
319
+ 45,self_attn.q_proj,13.71338,0.01000,2.417
320
+ 45,self_attn.o_proj,0.12826,0.01000,2.435
321
+ 45,mlp.up_proj,29.94445,0.01000,2.594
322
+ 45,mlp.gate_proj,35.62438,0.01000,2.567
323
+ 45,mlp.down_proj,0.75896,0.01000,12.476
324
+ 46,self_attn.k_proj,5.03439,0.01000,2.413
325
+ 46,self_attn.v_proj,0.41520,0.01000,2.373
326
+ 46,self_attn.q_proj,3.65707,0.01000,2.418
327
+ 46,self_attn.o_proj,0.02733,0.01000,2.429
328
+ 46,mlp.up_proj,30.43668,0.01000,2.596
329
+ 46,mlp.gate_proj,36.21279,0.01000,2.555
330
+ 46,mlp.down_proj,0.70465,0.01000,12.484
331
+ 47,self_attn.k_proj,9.32724,0.01000,2.419
332
+ 47,self_attn.v_proj,1.12588,0.01000,2.366
333
+ 47,self_attn.q_proj,13.99360,0.01000,2.424
334
+ 47,self_attn.o_proj,0.07536,0.01000,2.429
335
+ 47,mlp.up_proj,30.93128,0.01000,2.606
336
+ 47,mlp.gate_proj,36.81147,0.01000,2.562
337
+ 47,mlp.down_proj,0.75357,0.01000,12.446
338
+ 48,self_attn.k_proj,9.56606,0.01000,2.397
339
+ 48,self_attn.v_proj,1.20021,0.01000,2.341
340
+ 48,self_attn.q_proj,14.59574,0.01000,2.424
341
+ 48,self_attn.o_proj,0.05555,0.01000,2.431
342
+ 48,mlp.up_proj,31.49958,0.01000,2.590
343
+ 48,mlp.gate_proj,37.59175,0.01000,2.550
344
+ 48,mlp.down_proj,0.85475,0.01000,12.454
345
+ 49,self_attn.k_proj,9.73940,0.01000,2.409
346
+ 49,self_attn.v_proj,1.12793,0.01000,2.345
347
+ 49,self_attn.q_proj,14.39461,0.01000,2.426
348
+ 49,self_attn.o_proj,0.07215,0.01000,2.433
349
+ 49,mlp.up_proj,32.26957,0.01000,2.601
350
+ 49,mlp.gate_proj,38.52919,0.01000,2.558
351
+ 49,mlp.down_proj,0.85321,0.01000,12.449
352
+ 50,self_attn.k_proj,7.50268,0.01000,2.412
353
+ 50,self_attn.v_proj,0.91148,0.01000,2.363
354
+ 50,self_attn.q_proj,9.03854,0.01000,2.414
355
+ 50,self_attn.o_proj,0.05698,0.01000,2.413
356
+ 50,mlp.up_proj,32.78205,0.01000,2.599
357
+ 50,mlp.gate_proj,39.19064,0.01000,2.560
358
+ 50,mlp.down_proj,0.78843,0.01000,12.456
359
+ 51,self_attn.k_proj,8.62929,0.01000,2.384
360
+ 51,self_attn.v_proj,1.10167,0.01000,2.355
361
+ 51,self_attn.q_proj,12.73033,0.01000,2.422
362
+ 51,self_attn.o_proj,0.08332,0.01000,2.427
363
+ 51,mlp.up_proj,33.36840,0.01000,2.602
364
+ 51,mlp.gate_proj,39.81268,0.01000,2.552
365
+ 51,mlp.down_proj,0.84592,0.01000,12.439
366
+ 52,self_attn.k_proj,14.24103,0.01000,2.402
367
+ 52,self_attn.v_proj,1.52739,0.01000,2.350
368
+ 52,self_attn.q_proj,26.98552,0.01000,2.419
369
+ 52,self_attn.o_proj,0.23821,0.01000,2.426
370
+ 52,mlp.up_proj,34.04603,0.01000,2.598
371
+ 52,mlp.gate_proj,40.77630,0.01000,2.553
372
+ 52,mlp.down_proj,0.94730,0.01000,12.492
373
+ 53,self_attn.k_proj,11.13863,0.01000,2.406
374
+ 53,self_attn.v_proj,1.26610,0.01000,2.380
375
+ 53,self_attn.q_proj,15.89432,0.01000,2.417
376
+ 53,self_attn.o_proj,0.05793,0.01000,2.423
377
+ 53,mlp.up_proj,34.83026,0.01000,2.582
378
+ 53,mlp.gate_proj,41.77624,0.01000,2.552
379
+ 53,mlp.down_proj,0.92240,0.01000,12.391
380
+ 54,self_attn.k_proj,7.40175,0.01000,2.406
381
+ 54,self_attn.v_proj,0.79817,0.01000,2.341
382
+ 54,self_attn.q_proj,8.95007,0.01000,2.415
383
+ 54,self_attn.o_proj,0.10005,0.01000,2.442
384
+ 54,mlp.up_proj,35.37103,0.01000,2.599
385
+ 54,mlp.gate_proj,41.93651,0.01000,2.536
386
+ 54,mlp.down_proj,0.86324,0.01000,12.377
387
+ 55,self_attn.k_proj,6.85297,0.01000,2.419
388
+ 55,self_attn.v_proj,0.80341,0.01000,2.341
389
+ 55,self_attn.q_proj,9.80242,0.01000,2.419
390
+ 55,self_attn.o_proj,0.10725,0.01000,2.435
391
+ 55,mlp.up_proj,35.42970,0.01000,2.590
392
+ 55,mlp.gate_proj,42.14802,0.01000,2.560
393
+ 55,mlp.down_proj,0.90768,0.01000,12.442
394
+ 56,self_attn.k_proj,13.88305,0.01000,2.394
395
+ 56,self_attn.v_proj,1.85680,0.01000,2.350
396
+ 56,self_attn.q_proj,26.94255,0.01000,2.390
397
+ 56,self_attn.o_proj,0.20183,0.01000,2.436
398
+ 56,mlp.up_proj,36.07793,0.01000,2.592
399
+ 56,mlp.gate_proj,43.35723,0.01000,2.545
400
+ 56,mlp.down_proj,1.01939,0.01000,12.415
401
+ 57,self_attn.k_proj,10.69875,0.01000,2.405
402
+ 57,self_attn.v_proj,1.38184,0.01000,2.319
403
+ 57,self_attn.q_proj,15.78839,0.01000,2.408
404
+ 57,self_attn.o_proj,0.15118,0.01000,2.438
405
+ 57,mlp.up_proj,36.95335,0.01000,2.595
406
+ 57,mlp.gate_proj,44.50830,0.01000,2.544
407
+ 57,mlp.down_proj,0.99837,0.01000,12.462
408
+ 58,self_attn.k_proj,7.56804,0.01000,2.398
409
+ 58,self_attn.v_proj,1.12267,0.01000,2.348
410
+ 58,self_attn.q_proj,10.17075,0.01000,2.424
411
+ 58,self_attn.o_proj,0.08434,0.01000,2.441
412
+ 58,mlp.up_proj,37.68964,0.01000,2.599
413
+ 58,mlp.gate_proj,44.71976,0.01000,2.543
414
+ 58,mlp.down_proj,0.94810,0.01000,12.437
415
+ 59,self_attn.k_proj,7.43233,0.01000,2.413
416
+ 59,self_attn.v_proj,0.91834,0.01000,2.343
417
+ 59,self_attn.q_proj,8.87059,0.01000,2.395
418
+ 59,self_attn.o_proj,0.05050,0.01000,2.433
419
+ 59,mlp.up_proj,38.86263,0.01000,2.591
420
+ 59,mlp.gate_proj,46.91222,0.01000,2.557
421
+ 59,mlp.down_proj,1.04556,0.01000,12.446
422
+ 60,self_attn.k_proj,13.29610,0.01000,2.405
423
+ 60,self_attn.v_proj,2.16565,0.01000,2.373
424
+ 60,self_attn.q_proj,25.22976,0.01000,2.430
425
+ 60,self_attn.o_proj,0.16070,0.01000,2.401
426
+ 60,mlp.up_proj,39.92323,0.01000,2.594
427
+ 60,mlp.gate_proj,48.80389,0.01000,2.562
428
+ 60,mlp.down_proj,1.19647,0.01000,12.480
429
+ 61,self_attn.k_proj,9.04602,0.01000,2.407
430
+ 61,self_attn.v_proj,1.31423,0.01000,2.354
431
+ 61,self_attn.q_proj,11.27571,0.01000,2.430
432
+ 61,self_attn.o_proj,0.11997,0.01000,2.426
433
+ 61,mlp.up_proj,40.52758,0.01000,2.601
434
+ 61,mlp.gate_proj,49.42426,0.01000,2.551
435
+ 61,mlp.down_proj,1.14733,0.01000,12.427
436
+ 62,self_attn.k_proj,6.08225,0.01000,2.400
437
+ 62,self_attn.v_proj,0.54749,0.01000,2.341
438
+ 62,self_attn.q_proj,3.91657,0.01000,2.427
439
+ 62,self_attn.o_proj,0.03115,0.01000,2.430
440
+ 62,mlp.up_proj,40.40889,0.01000,2.569
441
+ 62,mlp.gate_proj,48.50503,0.01000,2.558
442
+ 62,mlp.down_proj,1.03680,0.01000,12.433
443
+ 63,self_attn.k_proj,7.13903,0.01000,2.395
444
+ 63,self_attn.v_proj,0.90019,0.01000,2.339
445
+ 63,self_attn.q_proj,8.04566,0.01000,2.423
446
+ 63,self_attn.o_proj,0.06037,0.01000,2.428
447
+ 63,mlp.up_proj,42.07748,0.01000,2.598
448
+ 63,mlp.gate_proj,51.37971,0.01000,2.556
449
+ 63,mlp.down_proj,1.16115,0.01000,12.440
450
+ 64,self_attn.k_proj,12.30144,0.01000,2.389
451
+ 64,self_attn.v_proj,1.94175,0.01000,2.347
452
+ 64,self_attn.q_proj,20.16385,0.01000,2.420
453
+ 64,self_attn.o_proj,0.24632,0.01000,2.439
454
+ 64,mlp.up_proj,44.01347,0.01000,2.588
455
+ 64,mlp.gate_proj,55.13173,0.01000,2.553
456
+ 64,mlp.down_proj,1.38282,0.01000,12.488
457
+ 65,self_attn.k_proj,6.82733,0.01000,2.398
458
+ 65,self_attn.v_proj,0.78277,0.01000,2.352
459
+ 65,self_attn.q_proj,6.81213,0.01000,2.420
460
+ 65,self_attn.o_proj,0.07622,0.01000,2.441
461
+ 65,mlp.up_proj,44.64717,0.01000,2.598
462
+ 65,mlp.gate_proj,55.94937,0.01000,2.550
463
+ 65,mlp.down_proj,1.31563,0.01000,12.353
464
+ 66,self_attn.k_proj,7.05296,0.01000,2.387
465
+ 66,self_attn.v_proj,1.03377,0.01000,2.330
466
+ 66,self_attn.q_proj,8.85096,0.01000,2.411
467
+ 66,self_attn.o_proj,0.13433,0.01000,2.434
468
+ 66,mlp.up_proj,44.82061,0.01000,2.602
469
+ 66,mlp.gate_proj,54.01328,0.01000,2.544
470
+ 66,mlp.down_proj,1.22117,0.01000,12.403
471
+ 67,self_attn.k_proj,12.34406,0.01000,2.394
472
+ 67,self_attn.v_proj,2.19811,0.01000,2.371
473
+ 67,self_attn.q_proj,20.21918,0.01000,2.421
474
+ 67,self_attn.o_proj,0.23947,0.01000,2.428
475
+ 67,mlp.up_proj,46.74456,0.01000,2.591
476
+ 67,mlp.gate_proj,56.45784,0.01000,2.545
477
+ 67,mlp.down_proj,1.34151,0.01000,12.484
478
+ 68,self_attn.k_proj,13.16044,0.01000,2.423
479
+ 68,self_attn.v_proj,2.73707,0.01000,2.354
480
+ 68,self_attn.q_proj,24.21140,0.01000,2.414
481
+ 68,self_attn.o_proj,0.30300,0.01000,2.456
482
+ 68,mlp.up_proj,49.65003,0.01000,2.607
483
+ 68,mlp.gate_proj,61.89810,0.01000,2.551
484
+ 68,mlp.down_proj,1.64361,0.01000,12.423
485
+ 69,self_attn.k_proj,10.67953,0.01000,2.396
486
+ 69,self_attn.v_proj,2.16242,0.01000,2.341
487
+ 69,self_attn.q_proj,18.11952,0.01000,2.400
488
+ 69,self_attn.o_proj,0.20832,0.01000,2.421
489
+ 69,mlp.up_proj,50.93095,0.01000,2.596
490
+ 69,mlp.gate_proj,62.72586,0.01000,2.549
491
+ 69,mlp.down_proj,1.61045,0.01000,12.533
492
+ 70,self_attn.k_proj,10.28304,0.01000,2.399
493
+ 70,self_attn.v_proj,1.98366,0.01000,2.359
494
+ 70,self_attn.q_proj,19.90069,0.01000,2.390
495
+ 70,self_attn.o_proj,0.35756,0.01000,2.436
496
+ 70,mlp.up_proj,51.26246,0.01000,2.604
497
+ 70,mlp.gate_proj,60.92408,0.01000,2.563
498
+ 70,mlp.down_proj,1.57580,0.01000,12.480
499
+ 71,self_attn.k_proj,12.47268,0.01000,2.396
500
+ 71,self_attn.v_proj,2.70028,0.01000,2.355
501
+ 71,self_attn.q_proj,27.55191,0.01000,2.385
502
+ 71,self_attn.o_proj,0.93984,0.01000,2.428
503
+ 71,mlp.up_proj,55.26141,0.01000,2.595
504
+ 71,mlp.gate_proj,65.54773,0.01000,2.549
505
+ 71,mlp.down_proj,1.90825,0.01000,12.460
506
+ 72,self_attn.k_proj,13.01985,0.01000,2.408
507
+ 72,self_attn.v_proj,3.01720,0.01000,2.357
508
+ 72,self_attn.q_proj,30.32354,0.01000,2.437
509
+ 72,self_attn.o_proj,0.44778,0.01000,2.445
510
+ 72,mlp.up_proj,58.38693,0.01000,2.610
511
+ 72,mlp.gate_proj,71.82819,0.01000,2.559
512
+ 72,mlp.down_proj,2.24979,0.01000,12.446
513
+ 73,self_attn.k_proj,12.93038,0.01000,2.406
514
+ 73,self_attn.v_proj,3.20805,0.01000,2.342
515
+ 73,self_attn.q_proj,29.55270,0.01000,2.424
516
+ 73,self_attn.o_proj,1.00655,0.01000,2.436
517
+ 73,mlp.up_proj,58.70067,0.01000,2.594
518
+ 73,mlp.gate_proj,71.63084,0.01000,2.556
519
+ 73,mlp.down_proj,2.31351,0.01000,12.468
520
+ 74,self_attn.k_proj,12.20197,0.01000,2.403
521
+ 74,self_attn.v_proj,3.11274,0.01000,2.358
522
+ 74,self_attn.q_proj,28.71220,0.01000,2.423
523
+ 74,self_attn.o_proj,1.16861,0.01000,2.403
524
+ 74,mlp.up_proj,61.27262,0.01000,2.587
525
+ 74,mlp.gate_proj,74.21090,0.01000,2.548
526
+ 74,mlp.down_proj,2.48106,0.01000,12.486
527
+ 75,self_attn.k_proj,11.45592,0.01000,2.423
528
+ 75,self_attn.v_proj,3.51124,0.01000,2.359
529
+ 75,self_attn.q_proj,30.38795,0.01000,2.413
530
+ 75,self_attn.o_proj,2.18176,0.01000,2.446
531
+ 75,mlp.up_proj,66.98369,0.01000,2.612
532
+ 75,mlp.gate_proj,83.39505,0.01000,2.540
533
+ 75,mlp.down_proj,3.69956,0.01000,12.424
534
+ 76,self_attn.k_proj,10.18937,0.01000,2.412
535
+ 76,self_attn.v_proj,3.41040,0.01000,2.366
536
+ 76,self_attn.q_proj,27.26140,0.01000,2.445
537
+ 76,self_attn.o_proj,1.05649,0.01000,2.450
538
+ 76,mlp.up_proj,78.13490,0.01000,2.615
539
+ 76,mlp.gate_proj,118.95868,0.01000,2.555
540
+ 76,mlp.down_proj,5.51300,0.01000,12.506
541
+ 77,self_attn.k_proj,11.54971,0.01000,2.413
542
+ 77,self_attn.v_proj,4.01822,0.01000,2.364
543
+ 77,self_attn.q_proj,29.42512,0.01000,2.424
544
+ 77,self_attn.o_proj,1.65369,0.01000,2.446
545
+ 77,mlp.up_proj,74.31666,0.01000,2.601
546
+ 77,mlp.gate_proj,93.92165,0.01000,2.547
547
+ 77,mlp.down_proj,6.31596,0.01000,12.536
548
+ 78,self_attn.k_proj,10.21922,0.01000,2.425
549
+ 78,self_attn.v_proj,2.88337,0.01000,2.382
550
+ 78,self_attn.q_proj,24.15326,0.01000,2.417
551
+ 78,self_attn.o_proj,1.91129,0.01000,2.453
552
+ 78,mlp.up_proj,71.57212,0.01000,2.619
553
+ 78,mlp.gate_proj,88.37552,0.01000,2.566
554
+ 78,mlp.down_proj,13.54613,0.01000,12.559
555
+ 79,self_attn.k_proj,4.50027,0.01000,2.416
556
+ 79,self_attn.v_proj,1.45889,0.01000,2.372
557
+ 79,self_attn.q_proj,8.78865,0.01000,2.427
558
+ 79,self_attn.o_proj,1.06731,0.01000,2.438
559
+ 79,mlp.up_proj,44.81396,0.01000,2.621
560
+ 79,mlp.gate_proj,52.70864,0.01000,2.574
561
+ 79,mlp.down_proj,18.51311,0.01000,12.513
quantize_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bits": 4,
3
+ "dynamic": null,
4
+ "group_size": 128,
5
+ "desc_act": true,
6
+ "sym": true,
7
+ "lm_head": false,
8
+ "quant_method": "gptq",
9
+ "checkpoint_format": "gptq",
10
+ "meta": {
11
+ "quantizer": [
12
+ "gptqmodel:1.4.0-dev"
13
+ ],
14
+ "uri": "https://github.com/modelcloud/gptqmodel",
15
+ "damp_percent": 0.01,
16
+ "damp_auto_increment": 0.0015,
17
+ "static_groups": false,
18
+ "true_sequential": true
19
+ }
20
+ }