alyssavance committed on
Commit
675bd81
1 Parent(s): 6d280cf

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
config.json ADDED
@@ -0,0 +1,205 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 16384,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 53248,
14
+ "max_position_embeddings": 131072,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 128,
18
+ "num_hidden_layers": 126,
19
+ "num_key_value_heads": 8,
20
+ "pretraining_tp": 1,
21
+ "quantization_config": {
22
+ "mlp.down_proj": {
23
+ "offload_meta": false,
24
+ "scale_quant_params": {
25
+ "channel_wise": true,
26
+ "group_size": 128,
27
+ "nbits": 8,
28
+ "optimize": false
29
+ },
30
+ "weight_quant_params": {
31
+ "axis": 0,
32
+ "channel_wise": true,
33
+ "group_size": 128,
34
+ "nbits": 4,
35
+ "optimize": true,
36
+ "round_zero": true,
37
+ "view_as_float": false
38
+ },
39
+ "zero_quant_params": {
40
+ "channel_wise": false,
41
+ "group_size": null,
42
+ "nbits": 8,
43
+ "optimize": false
44
+ }
45
+ },
46
+ "mlp.gate_proj": {
47
+ "offload_meta": false,
48
+ "scale_quant_params": {
49
+ "channel_wise": true,
50
+ "group_size": 128,
51
+ "nbits": 8,
52
+ "optimize": false
53
+ },
54
+ "weight_quant_params": {
55
+ "axis": 0,
56
+ "channel_wise": true,
57
+ "group_size": 128,
58
+ "nbits": 4,
59
+ "optimize": true,
60
+ "round_zero": true,
61
+ "view_as_float": false
62
+ },
63
+ "zero_quant_params": {
64
+ "channel_wise": false,
65
+ "group_size": null,
66
+ "nbits": 8,
67
+ "optimize": false
68
+ }
69
+ },
70
+ "mlp.up_proj": {
71
+ "offload_meta": false,
72
+ "scale_quant_params": {
73
+ "channel_wise": true,
74
+ "group_size": 128,
75
+ "nbits": 8,
76
+ "optimize": false
77
+ },
78
+ "weight_quant_params": {
79
+ "axis": 0,
80
+ "channel_wise": true,
81
+ "group_size": 128,
82
+ "nbits": 4,
83
+ "optimize": true,
84
+ "round_zero": true,
85
+ "view_as_float": false
86
+ },
87
+ "zero_quant_params": {
88
+ "channel_wise": false,
89
+ "group_size": null,
90
+ "nbits": 8,
91
+ "optimize": false
92
+ }
93
+ },
94
+ "self_attn.k_proj": {
95
+ "offload_meta": false,
96
+ "scale_quant_params": {
97
+ "channel_wise": true,
98
+ "group_size": 128,
99
+ "nbits": 8,
100
+ "optimize": false
101
+ },
102
+ "weight_quant_params": {
103
+ "axis": 0,
104
+ "channel_wise": true,
105
+ "group_size": 128,
106
+ "nbits": 4,
107
+ "optimize": true,
108
+ "round_zero": true,
109
+ "view_as_float": false
110
+ },
111
+ "zero_quant_params": {
112
+ "channel_wise": false,
113
+ "group_size": null,
114
+ "nbits": 8,
115
+ "optimize": false
116
+ }
117
+ },
118
+ "self_attn.o_proj": {
119
+ "offload_meta": false,
120
+ "scale_quant_params": {
121
+ "channel_wise": true,
122
+ "group_size": 128,
123
+ "nbits": 8,
124
+ "optimize": false
125
+ },
126
+ "weight_quant_params": {
127
+ "axis": 0,
128
+ "channel_wise": true,
129
+ "group_size": 128,
130
+ "nbits": 4,
131
+ "optimize": true,
132
+ "round_zero": true,
133
+ "view_as_float": false
134
+ },
135
+ "zero_quant_params": {
136
+ "channel_wise": false,
137
+ "group_size": null,
138
+ "nbits": 8,
139
+ "optimize": false
140
+ }
141
+ },
142
+ "self_attn.q_proj": {
143
+ "offload_meta": false,
144
+ "scale_quant_params": {
145
+ "channel_wise": true,
146
+ "group_size": 128,
147
+ "nbits": 8,
148
+ "optimize": false
149
+ },
150
+ "weight_quant_params": {
151
+ "axis": 0,
152
+ "channel_wise": true,
153
+ "group_size": 128,
154
+ "nbits": 4,
155
+ "optimize": true,
156
+ "round_zero": true,
157
+ "view_as_float": false
158
+ },
159
+ "zero_quant_params": {
160
+ "channel_wise": false,
161
+ "group_size": null,
162
+ "nbits": 8,
163
+ "optimize": false
164
+ }
165
+ },
166
+ "self_attn.v_proj": {
167
+ "offload_meta": false,
168
+ "scale_quant_params": {
169
+ "channel_wise": true,
170
+ "group_size": 128,
171
+ "nbits": 8,
172
+ "optimize": false
173
+ },
174
+ "weight_quant_params": {
175
+ "axis": 0,
176
+ "channel_wise": true,
177
+ "group_size": 128,
178
+ "nbits": 4,
179
+ "optimize": true,
180
+ "round_zero": true,
181
+ "view_as_float": false
182
+ },
183
+ "zero_quant_params": {
184
+ "channel_wise": false,
185
+ "group_size": null,
186
+ "nbits": 8,
187
+ "optimize": false
188
+ }
189
+ }
190
+ },
191
+ "rms_norm_eps": 1e-05,
192
+ "rope_scaling": {
193
+ "factor": 8.0,
194
+ "high_freq_factor": 4.0,
195
+ "low_freq_factor": 1.0,
196
+ "original_max_position_embeddings": 8192,
197
+ "rope_type": "llama3"
198
+ },
199
+ "rope_theta": 500000.0,
200
+ "tie_word_embeddings": false,
201
+ "torch_dtype": "bfloat16",
202
+ "transformers_version": "4.44.2",
203
+ "use_cache": true,
204
+ "vocab_size": 128256
205
+ }
qmodel_shard_aa.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21eeb346dcb381d7b98b45ec5d3bceb5404c6736e488e26d7e2b98ed85cf3fe9
3
+ size 4294967296
qmodel_shard_ab.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f37e98d57602c59bf308fd8a7bc60a64c40ea570ce645ed9362e3a883d516da4
3
+ size 4294967296
qmodel_shard_ac.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a96a033114839961e135dbf74724298afa0ecdbcec325a0f34618163d56a0e50
3
+ size 4294967296
qmodel_shard_ad.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe7e4cbba5dacec21030c27a9f82ddbc713ad1838883008c6cb0c856b8d06f4
3
+ size 4294967296
qmodel_shard_ae.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3286ee57e5de7e67ac5532c8205bd36fedcac29362381d458639f5b0a9bb832
3
+ size 4294967296
qmodel_shard_af.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ce6580f87f9d6551fd5511eaa78dbe98725cab31593bfaeba6a55ffc349a4a5
3
+ size 4294967296
qmodel_shard_ag.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80d3a21b9abdbe59b903a60e10cf617455f4076f44bc079a1621682aad1652e9
3
+ size 4294967296
qmodel_shard_ah.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b6900598f7eb9fd7217c3d67a5d2ade11744ec2598b74ca6af5b69d00a0aba3
3
+ size 4294967296
qmodel_shard_ai.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624555e9721cef28bc8aa335ddb42f8688622a6dc38510197546be0f08cf04c5
3
+ size 4294967296
qmodel_shard_aj.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dad3661f13559e9b13e6511197475de3780d3af6ba3888b2d20339e6197311e9
3
+ size 4294967296
qmodel_shard_ak.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79762d8b6ce72ff8c3e6205293a279b7ddfe1735cc467d37ae3c2fd0ab8e6bcd
3
+ size 4294967296
qmodel_shard_al.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb91a646f64dc6c4fd30db1a3178b204491e37318dfbba4eecb1ac6e2dff6eb
3
+ size 4294967296
qmodel_shard_am.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34068b2a1ae5c28ee4b65c48259f6cca1ba071cfd93c8dbdbd34878ab9e0f9c5
3
+ size 4294967296
qmodel_shard_an.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d1a5a760f10504d93c8d040cf3403a745d7ae05b35577740e64c3d6c4953ba2
3
+ size 4294967296
qmodel_shard_ao.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c1146c3a2436e454cccf7bbb78afe57e2843a6fb9a8ae6f162ce07329c66202
3
+ size 4294967296
qmodel_shard_ap.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6c7b9ee046ec95462bbaa23331f787a9139ad21d720c727e9b41c157f134674
3
+ size 4294967296
qmodel_shard_aq.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cac7e31ce500e74e449a2a3785d20b9f175ce485c4e29a5e6d080135481448c
3
+ size 4294967296
qmodel_shard_ar.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13532b6a81fa6b826e62b424df86527e7954374f8b639a91f04c8ec6ca385b67
3
+ size 4294967296
qmodel_shard_as.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66d5a08c4ea07177018abdfa3f067cae56d3f5baa74ae9929ee3c02e664f3180
3
+ size 4294967296
qmodel_shard_at.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:978c5e26c04b2367025eff3642281770f24d685cae52cc863843973386089b30
3
+ size 4294967296
qmodel_shard_au.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37340acea730e4ebb45e7d9e6fd5ab041fa3d4d65e60c2ac22836dd41db03f2f
3
+ size 4294967296
qmodel_shard_av.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2459097b646bed5a00843a649f1bc186c3fa87d6c4cd151b20e350a2dc846226
3
+ size 4294967296
qmodel_shard_aw.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33881e290454e78e5f945561edda1c29cdf1c1b08d84ce91ed689d3058057869
3
+ size 4294967296
qmodel_shard_ax.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:070ad92ce3186483fd1eefe363faf939be54b184548782f0f1c4ac5086b9f2dc
3
+ size 4294967296
qmodel_shard_ay.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2828f30bdd59efed738dbe0f365604a76955a154fe90c0f4af19e5269e31b57
3
+ size 4294967296
qmodel_shard_az.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:410117e7e9d047d0bc8a9e9641ee45eca0e0d850998fe3f5ffcc1e5603851c89
3
+ size 4294967296
qmodel_shard_ba.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af54c1ed9a5c7bfb3f5443b6dba15bbba3b756d174e7251806133a530efb8de9
3
+ size 4294967296
qmodel_shard_bb.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8c631f8af87afadcf90eff63ef534a5e77f077d1352a6d772430575f625482a
3
+ size 4294967296
qmodel_shard_bc.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f284371a3e26facab38544ab7e3ece93ebecbf04d11122801928405d9b5ed1a2
3
+ size 4294967296
qmodel_shard_bd.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90c909ac4bc7e185095816f07c36881e4c66591a247bfedae48807e555fda02d
3
+ size 4294967296
qmodel_shard_be.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5bdf94773d41f6970d5638a735cfb0784cc3ea5411bf6ff4d6afdba1e7d4804
3
+ size 4294967296
qmodel_shard_bf.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee122d16f9a1775ed711463cabda618f615b523fb8e855b0d34fe4fd8e09408
3
+ size 4294967296
qmodel_shard_bg.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c9ca6a4d62271ec90a709fb5813fe8bff288bf682c628106f43fbf7f8e84078
3
+ size 4294967296
qmodel_shard_bh.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f31928d756d078057828ae4a41e86a44091d01370d7a30cf9c99a16d408a0d25
3
+ size 4294967296
qmodel_shard_bi.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b5e888c1f79bc9e0cc8ff3707f027889526132083c4d9d48df8f66ea9bc10c
3
+ size 4294967296
qmodel_shard_bj.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d739ec439326fed2b7db16c842646a4c3eb1921492bf8b20242777676d86b371
3
+ size 4294967296
qmodel_shard_bk.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d48ca08db9b763747ce46b52e672ea4798a9a361ac6c9e4d7ffa444482db04d
3
+ size 4294967296
qmodel_shard_bl.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:534d11f549ef831745b15bf59f6500889651e340c9c127cea5abec0c39016e03
3
+ size 4294967296
qmodel_shard_bm.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f0494f8392f7daa61e64373b4130ba2b35e9825f243f9d212543d3ffe8b41a5
3
+ size 4294967296
qmodel_shard_bn.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51db805a1d16c25f1155eeb9e394cc92df7ecd5b4b1202fd4d8cc9945891ab7b
3
+ size 4294967296
qmodel_shard_bo.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:832c8fbcd3334eef055c8fc42c6673fd1f66676fc998326e51f6c985d1bccff0
3
+ size 4294967296
qmodel_shard_bp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b62fa3cc337f5e8e7af5ebc748b7883bdecdf527abb6acb3c44b1bc13f75d5a
3
+ size 4294967296
qmodel_shard_bq.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd8734ca2544319bdea604e4ab38fc5d1399a4af99bc78ec2e25df9d7cced936
3
+ size 4294967296
qmodel_shard_br.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:317af14c8ba53a9d1dc97c34db58b2def1a4202d6f1b8141743340e4f7ad4bef
3
+ size 4294967296
qmodel_shard_bs.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f488d8b1df274bbce6cba25a49bdbcd53cd640f43ea61a4adbc7d8a85374b588
3
+ size 4294967296
qmodel_shard_bt.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f71de924160044d34a660c471b2253dbad23dc006feb5b01c7cef66b3ccfeba
3
+ size 4294967296
qmodel_shard_bu.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c32add4fd22844ca5104418411db8d5835dcefa75dcedc992891d6d85f9b23b
3
+ size 4294967296
qmodel_shard_bv.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac395cfdcf7685c07f8b9eb53770b7d1046b090f2f72b3a7c03d9af845845ee2
3
+ size 4294967296
qmodel_shard_bw.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6d0d6c9235d112df82e296581da7231a518ae127752b7477ce0bf7e5f9647fc
3
+ size 4294967296