alyssavance committed on
Commit
5d1b27c
·
verified ·
1 Parent(s): b541b49

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,205 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 16384,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 53248,
14
+ "max_position_embeddings": 131072,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 128,
18
+ "num_hidden_layers": 126,
19
+ "num_key_value_heads": 8,
20
+ "pretraining_tp": 1,
21
+ "quantization_config": {
22
+ "mlp.down_proj": {
23
+ "offload_meta": false,
24
+ "scale_quant_params": {
25
+ "channel_wise": true,
26
+ "group_size": 128,
27
+ "nbits": 8,
28
+ "optimize": false
29
+ },
30
+ "weight_quant_params": {
31
+ "axis": 0,
32
+ "channel_wise": true,
33
+ "group_size": 128,
34
+ "nbits": 3,
35
+ "optimize": true,
36
+ "round_zero": false,
37
+ "view_as_float": false
38
+ },
39
+ "zero_quant_params": {
40
+ "channel_wise": false,
41
+ "group_size": null,
42
+ "nbits": 8,
43
+ "optimize": false
44
+ }
45
+ },
46
+ "mlp.gate_proj": {
47
+ "offload_meta": false,
48
+ "scale_quant_params": {
49
+ "channel_wise": true,
50
+ "group_size": 128,
51
+ "nbits": 8,
52
+ "optimize": false
53
+ },
54
+ "weight_quant_params": {
55
+ "axis": 0,
56
+ "channel_wise": true,
57
+ "group_size": 128,
58
+ "nbits": 3,
59
+ "optimize": true,
60
+ "round_zero": false,
61
+ "view_as_float": false
62
+ },
63
+ "zero_quant_params": {
64
+ "channel_wise": false,
65
+ "group_size": null,
66
+ "nbits": 8,
67
+ "optimize": false
68
+ }
69
+ },
70
+ "mlp.up_proj": {
71
+ "offload_meta": false,
72
+ "scale_quant_params": {
73
+ "channel_wise": true,
74
+ "group_size": 128,
75
+ "nbits": 8,
76
+ "optimize": false
77
+ },
78
+ "weight_quant_params": {
79
+ "axis": 0,
80
+ "channel_wise": true,
81
+ "group_size": 128,
82
+ "nbits": 3,
83
+ "optimize": true,
84
+ "round_zero": false,
85
+ "view_as_float": false
86
+ },
87
+ "zero_quant_params": {
88
+ "channel_wise": false,
89
+ "group_size": null,
90
+ "nbits": 8,
91
+ "optimize": false
92
+ }
93
+ },
94
+ "self_attn.k_proj": {
95
+ "offload_meta": false,
96
+ "scale_quant_params": {
97
+ "channel_wise": true,
98
+ "group_size": 128,
99
+ "nbits": 8,
100
+ "optimize": false
101
+ },
102
+ "weight_quant_params": {
103
+ "axis": 0,
104
+ "channel_wise": true,
105
+ "group_size": 128,
106
+ "nbits": 3,
107
+ "optimize": true,
108
+ "round_zero": false,
109
+ "view_as_float": false
110
+ },
111
+ "zero_quant_params": {
112
+ "channel_wise": false,
113
+ "group_size": null,
114
+ "nbits": 8,
115
+ "optimize": false
116
+ }
117
+ },
118
+ "self_attn.o_proj": {
119
+ "offload_meta": false,
120
+ "scale_quant_params": {
121
+ "channel_wise": true,
122
+ "group_size": 128,
123
+ "nbits": 8,
124
+ "optimize": false
125
+ },
126
+ "weight_quant_params": {
127
+ "axis": 0,
128
+ "channel_wise": true,
129
+ "group_size": 128,
130
+ "nbits": 3,
131
+ "optimize": true,
132
+ "round_zero": false,
133
+ "view_as_float": false
134
+ },
135
+ "zero_quant_params": {
136
+ "channel_wise": false,
137
+ "group_size": null,
138
+ "nbits": 8,
139
+ "optimize": false
140
+ }
141
+ },
142
+ "self_attn.q_proj": {
143
+ "offload_meta": false,
144
+ "scale_quant_params": {
145
+ "channel_wise": true,
146
+ "group_size": 128,
147
+ "nbits": 8,
148
+ "optimize": false
149
+ },
150
+ "weight_quant_params": {
151
+ "axis": 0,
152
+ "channel_wise": true,
153
+ "group_size": 128,
154
+ "nbits": 3,
155
+ "optimize": true,
156
+ "round_zero": false,
157
+ "view_as_float": false
158
+ },
159
+ "zero_quant_params": {
160
+ "channel_wise": false,
161
+ "group_size": null,
162
+ "nbits": 8,
163
+ "optimize": false
164
+ }
165
+ },
166
+ "self_attn.v_proj": {
167
+ "offload_meta": false,
168
+ "scale_quant_params": {
169
+ "channel_wise": true,
170
+ "group_size": 128,
171
+ "nbits": 8,
172
+ "optimize": false
173
+ },
174
+ "weight_quant_params": {
175
+ "axis": 0,
176
+ "channel_wise": true,
177
+ "group_size": 128,
178
+ "nbits": 3,
179
+ "optimize": true,
180
+ "round_zero": false,
181
+ "view_as_float": false
182
+ },
183
+ "zero_quant_params": {
184
+ "channel_wise": false,
185
+ "group_size": null,
186
+ "nbits": 8,
187
+ "optimize": false
188
+ }
189
+ }
190
+ },
191
+ "rms_norm_eps": 1e-05,
192
+ "rope_scaling": {
193
+ "factor": 8.0,
194
+ "high_freq_factor": 4.0,
195
+ "low_freq_factor": 1.0,
196
+ "original_max_position_embeddings": 8192,
197
+ "rope_type": "llama3"
198
+ },
199
+ "rope_theta": 500000.0,
200
+ "tie_word_embeddings": false,
201
+ "torch_dtype": "bfloat16",
202
+ "transformers_version": "4.44.2",
203
+ "use_cache": true,
204
+ "vocab_size": 128256
205
+ }
qmodel_shard_aa.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3499bb188fa4906a9b80bf0fe456389bd92cef042c4881b626b6f1bf6418d250
3
+ size 4294967296
qmodel_shard_ab.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15bfe5aee7aaec65a8f9f49ad584470293786ee7ee2a02b5ef53a79869a4741d
3
+ size 4294967296
qmodel_shard_ac.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a2943f829e487b4d49d9d1e5f74111014078d6f9ade4cdf6df39dc1aca1c5a
3
+ size 4294967296
qmodel_shard_ad.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0747269f940b86034e95525cd3ea39bfbaef7721836f073b771d2d5fe8e50332
3
+ size 4294967296
qmodel_shard_ae.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbd03022f66e4d6ab38331da6e52828d1816cf64e145f6607f3f9a29d63efb10
3
+ size 4294967296
qmodel_shard_af.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64164e2c50ac54f8d94386e35708340e93a3c4cfd1f3b8c764d91850f8a57d88
3
+ size 4294967296
qmodel_shard_ag.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:241eaf6385e9e571530beb16cc8fb74487afb46b1a363fc3a30d49e2bd29e62c
3
+ size 4294967296
qmodel_shard_ah.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:673437b100b5dd1ef92a2bce1b67e76a7285f415fa1a7973fe9e4986dccb0510
3
+ size 4294967296
qmodel_shard_ai.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54a7abf92e6efeb3042e3f60d752491e4ed87e2e949c93bee66818eab507cc5f
3
+ size 4294967296
qmodel_shard_aj.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc9cb3f13b5b2c7f626484c591e56d2d01f299e6a9d61139493bcb65f20a5452
3
+ size 4294967296
qmodel_shard_ak.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbe35e0deb07a5b5eb426a6689e22259b89d006ad5bab3992bbdf0a2611377ce
3
+ size 4294967296
qmodel_shard_al.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f31dfcbf1359754531f315c51e6630972c0170384150c8dc95a5d27382c6b4a
3
+ size 4294967296
qmodel_shard_am.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd457168f88c4c9579d1b7bddf299aecf66022da209ef3f484b895ea7661905
3
+ size 4294967296
qmodel_shard_an.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd823acbd013f8582628391c4f5a0568a47dac372dab4c9895e2038aff9b8675
3
+ size 4294967296
qmodel_shard_ao.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfbde27bdcd16b9bf8d258c9f35248aeb6582d15a35f98944157d6bf8ea3ea9e
3
+ size 4294967296
qmodel_shard_ap.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e132774fe97570900b0abb1e452709fdad03247a61069de66d1ae56b4f0f9d6
3
+ size 4294967296
qmodel_shard_aq.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d48ee3f5f078e8954bb5100f086faae6ccb6e626dbd2efd451672db92581836d
3
+ size 4294967296
qmodel_shard_ar.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:677106aa663ee2eec080b8e4490ec4df6d3e55b4f29f5fd7626d85184caa7093
3
+ size 4294967296
qmodel_shard_as.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ece20e414c1d971db1c0d0e6cafbc5170791c5107748385aa36c8dac42d24a4e
3
+ size 4294967296
qmodel_shard_at.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b00ceecabd0937742ab5f49f74e451e738b48295facb8e4f9db489a37875521d
3
+ size 4294967296
qmodel_shard_au.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac91e828a89709481a3b625b9212b3a9af2a44461eaaccf477552e873a7cf4e
3
+ size 4294967296
qmodel_shard_av.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa35635ab50ae4cd63cec665bb79529fc178e0797557e30dfd00c992deceba2e
3
+ size 4294967296
qmodel_shard_aw.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca4a82bad44820ce4abe6053da956a35ec04d8492f50bb212455586f2aa926c7
3
+ size 4294967296
qmodel_shard_ax.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7687833a9407616999a5eb3da299c0a50cf3735fc2013c8d44e0946ceb60439e
3
+ size 4294967296
qmodel_shard_ay.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b69562d4cfe30a64c371142e4543ad1aa3bcceb22b2b389bcb7045299e9ae18
3
+ size 4294967296
qmodel_shard_az.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9c96d23ee51c5a944fb2df7f88512c7ce4f5f27bf4b540e3a860421511bc23a
3
+ size 4294967296
qmodel_shard_ba.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2da0f067c6e4174f59a70dfaceb62c28bda0ec9e5abc224f6415e1152eee8b54
3
+ size 4294967296
qmodel_shard_bb.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7504fe9d1b3def9c497fc0c5841d7ec55440aeede859eab86aa098ce8c9d7c
3
+ size 4294967296
qmodel_shard_bc.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bab37d55e9ff2efb49b25a80107f3e65e7b1ce798c5677e5e9dd3d0232ad3ec
3
+ size 4294967296
qmodel_shard_bd.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4719b63dcbdeaa122f5c8d6ea68c4029151325169f51ea074b6a2c6c15ce8a6d
3
+ size 4294967296
qmodel_shard_be.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4252536b7571a476170371dc47b9d5e0b47048b9e4e8278cb4e3eacb855087f1
3
+ size 4294967296
qmodel_shard_bf.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65fd5f01bdb2d4c08f3b944079dc488d223e6b1f221e838b52b9e6f08adb223
3
+ size 4294967296
qmodel_shard_bg.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:761d5e173588b70d03e799e3d48e3f4a8f53199251863c575b8c488dd7b2797d
3
+ size 4294967296
qmodel_shard_bh.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f6f20c5a4dd78a2d19a82ca25b4f28b5fb538bc44f4551a1f5986c7de26db77
3
+ size 4294967296
qmodel_shard_bi.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b37c1bebb14301903a9ca30474d4d106f9995026f2073400ebae6e8a026a104
3
+ size 4294967296
qmodel_shard_bj.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bf9297918900cddc177b7293b50753d87de4dce831504b926485a96a43239fa
3
+ size 4294967296
qmodel_shard_bk.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f725439c6c335e5f0a3c2719a0cca931acf233a06e99f3d88b7318c54440ba9c
3
+ size 4294967296
qmodel_shard_bl.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98c9294e9213cc98ea42cc53213d856e98a4fe8960398c47ce9e036c985fb226
3
+ size 4294967296
qmodel_shard_bm.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3d6a24552930559c2d3bd88154896651591003779909da3d29dad717203c2bc
3
+ size 4294967296
qmodel_shard_bn.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a59d1dcb08e3850125f24b0a93611d98354614fae3e68797cb8c348f00036520
3
+ size 4294967296
qmodel_shard_bo.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:449fb4ace5f0e9e81b4a3051c88f72dfb9735bccdd2fb697ffb9b552009d6cb1
3
+ size 4294967296
qmodel_shard_bp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e6a6204d2b3882fc45851bea8028d1e3a5682b6182773568be7dd5f2b9b3ee3
3
+ size 4294967296
qmodel_shard_bq.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcbcb2901a2c43732198725cbb5b14297ae0dfa7573a8bb01ba83b1ed987f01e
3
+ size 4294967296
qmodel_shard_br.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c223d8e8997ec250e85e8b2f9de17daa5544b7689218be9ebd5466a235298cc6
3
+ size 1786659040