Radostin Cholakov
committed on
Commit
•
6e84fad
1
Parent(s):
37baa0b
Add nf_w4g64.
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +39 -0
- flute_config.json +5 -0
- generation_config.json +12 -0
- model-00001-of-00047.safetensors +3 -0
- model-00002-of-00047.safetensors +3 -0
- model-00003-of-00047.safetensors +3 -0
- model-00004-of-00047.safetensors +3 -0
- model-00005-of-00047.safetensors +3 -0
- model-00006-of-00047.safetensors +3 -0
- model-00007-of-00047.safetensors +3 -0
- model-00008-of-00047.safetensors +3 -0
- model-00009-of-00047.safetensors +3 -0
- model-00010-of-00047.safetensors +3 -0
- model-00011-of-00047.safetensors +3 -0
- model-00012-of-00047.safetensors +3 -0
- model-00013-of-00047.safetensors +3 -0
- model-00014-of-00047.safetensors +3 -0
- model-00015-of-00047.safetensors +3 -0
- model-00016-of-00047.safetensors +3 -0
- model-00017-of-00047.safetensors +3 -0
- model-00018-of-00047.safetensors +3 -0
- model-00019-of-00047.safetensors +3 -0
- model-00020-of-00047.safetensors +3 -0
- model-00021-of-00047.safetensors +3 -0
- model-00022-of-00047.safetensors +3 -0
- model-00023-of-00047.safetensors +3 -0
- model-00024-of-00047.safetensors +3 -0
- model-00025-of-00047.safetensors +3 -0
- model-00026-of-00047.safetensors +3 -0
- model-00027-of-00047.safetensors +3 -0
- model-00028-of-00047.safetensors +3 -0
- model-00029-of-00047.safetensors +3 -0
- model-00030-of-00047.safetensors +3 -0
- model-00031-of-00047.safetensors +3 -0
- model-00032-of-00047.safetensors +3 -0
- model-00033-of-00047.safetensors +3 -0
- model-00034-of-00047.safetensors +3 -0
- model-00035-of-00047.safetensors +3 -0
- model-00036-of-00047.safetensors +3 -0
- model-00037-of-00047.safetensors +3 -0
- model-00038-of-00047.safetensors +3 -0
- model-00039-of-00047.safetensors +3 -0
- model-00040-of-00047.safetensors +3 -0
- model-00041-of-00047.safetensors +3 -0
- model-00042-of-00047.safetensors +3 -0
- model-00043-of-00047.safetensors +3 -0
- model-00044-of-00047.safetensors +3 -0
- model-00045-of-00047.safetensors +3 -0
- model-00046-of-00047.safetensors +3 -0
- model-00047-of-00047.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/data/cl/scratch/model_weights/Meta-Llama-3.1-405B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"hidden_act": "silu",
|
15 |
+
"hidden_size": 16384,
|
16 |
+
"initializer_range": 0.02,
|
17 |
+
"intermediate_size": 53248,
|
18 |
+
"max_position_embeddings": 131072,
|
19 |
+
"mlp_bias": false,
|
20 |
+
"model_type": "llama",
|
21 |
+
"num_attention_heads": 128,
|
22 |
+
"num_hidden_layers": 126,
|
23 |
+
"num_key_value_heads": 16,
|
24 |
+
"pretraining_tp": 1,
|
25 |
+
"rms_norm_eps": 1e-05,
|
26 |
+
"rope_scaling": {
|
27 |
+
"factor": 8.0,
|
28 |
+
"high_freq_factor": 4.0,
|
29 |
+
"low_freq_factor": 1.0,
|
30 |
+
"original_max_position_embeddings": 8192,
|
31 |
+
"rope_type": "llama3"
|
32 |
+
},
|
33 |
+
"rope_theta": 500000.0,
|
34 |
+
"tie_word_embeddings": false,
|
35 |
+
"torch_dtype": "float16",
|
36 |
+
"transformers_version": "4.44.2",
|
37 |
+
"use_cache": true,
|
38 |
+
"vocab_size": 128256
|
39 |
+
}
|
flute_config.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"num_sms": 108,
|
3 |
+
"num_bits": 4,
|
4 |
+
"group_size": 64
|
5 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.44.2"
|
12 |
+
}
|
model-00001-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:495dcbdec465c627fff4bfc2fc00f031dcd0be35672c610edf844fe48321d0fb
|
3 |
+
size 4987035088
|
model-00002-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f30d9c03f342b8e260f426fd1a3b839e5c40df250eed0af50e04f57b8103f58e
|
3 |
+
size 4670584640
|
model-00003-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e4741c471a0d2a36531424baf2f50caafa0bfc1f42f8d40e6e867ad2f2642ef
|
3 |
+
size 4991448880
|
model-00004-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:579a254b5ce4e667e8f5a234a74640326c23772a1cf87d2e74adce669546053a
|
3 |
+
size 4955794296
|
model-00005-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87cc88fe5037ba89272bdff95b1b63715ef9a07557361f83effa9cf5332a51f0
|
3 |
+
size 4670518920
|
model-00006-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b130b5adc7914694846923aea96783535d31b9e17f2c9334bd6fb150adefb223
|
3 |
+
size 4670584728
|
model-00007-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a66603cf388fb8bd163c38eaf94b1730ff5ea57856d04d15e8ec2d534dcc0b02
|
3 |
+
size 4670584720
|
model-00008-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f40b97c2788325ebe23b61e5fadd59c25e5a0cf1b6fff492b84951a358695079
|
3 |
+
size 4991448968
|
model-00009-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc0b595c0c2ad39205d40eb0f7fcfc771628e7a07d97e24059c3ead421c1b641
|
3 |
+
size 4955794376
|
model-00010-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ad4d71a08f167bddbc6ca5271c95b52a2d71c5729650f607b43f3a14d057ef4
|
3 |
+
size 4670518952
|
model-00011-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02d2ee43a6e3a32ed8a6727ea384c83e188d0723db35ab962ebe8966958c3042
|
3 |
+
size 4670584728
|
model-00012-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b482b70c133ed65f25413c8095127d5bbfeaf80052bd9bfef814ab6f12b65606
|
3 |
+
size 4670584720
|
model-00013-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41eae7b5b6fe0b0bee87b6201d0180502f29b2d7cf9c6979b28f692d939bd044
|
3 |
+
size 4991448968
|
model-00014-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdbe39de3eed4154710cc66c51f1398cdd9ff305f78daf46836f2f15ff0d64a6
|
3 |
+
size 4955794376
|
model-00015-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80f493012ec20197abfce1ed51c64e78a3d859485b66980ec6818ba6eb4927e8
|
3 |
+
size 4670518952
|
model-00016-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21c60e876e7adc58e1ecc6f1365a6425444d14e72d856837dfe1a27045b1c693
|
3 |
+
size 4670584728
|
model-00017-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04b5487ae1c0dd41ec3b26e2be9ccc4b458cc7477bcbbd39dfe4e0998900ee19
|
3 |
+
size 4670584720
|
model-00018-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6bfbdfe61bc72eda15693fcd9ea65192cd3ca51949e3b40aea4a623d8f5ebcb
|
3 |
+
size 4991448968
|
model-00019-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b07be7d043bfb7fc0ada6ff6d3edfa9e3f336be0f98b2482b418612ff0fcddaa
|
3 |
+
size 4955794376
|
model-00020-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a95f1715ddeea09e709b37daf695c8f18fa61f49c1cdb0f74847944dc87c4684
|
3 |
+
size 4670518952
|
model-00021-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7d9068b777f7d38ed9b5e292cf9c74fc03bb2c40fbe64f236494e02ed732f09
|
3 |
+
size 4670584728
|
model-00022-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab7531f7c810cbdabd3c2b0a88ca682c585a7ca63ee0e2a6f3ec1ae41d657a7
|
3 |
+
size 4670584720
|
model-00023-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b95f97a12518390eea5feb46e264d8073f6cfb8fa8180fcc1bd8a2cc5146a6a
|
3 |
+
size 4991448968
|
model-00024-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad6c7a4380df7e01151b6b72f239ef78631f9ae31c37e19a72db59a4f586f561
|
3 |
+
size 4955794376
|
model-00025-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dfef1c3f49d8bd140f9d9ec9da6b7916be115c4c14d3b6b5ef94e41c839ad1f
|
3 |
+
size 4670518952
|
model-00026-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20bfe584172cdfdafd0e7b7fdf9b0398ade0648079cc11cfe8150df70f1dd1bd
|
3 |
+
size 4670584728
|
model-00027-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c23e5ad6f2c0ad51d31540e1a33bb860f307b84068422c130645969cfa0c596
|
3 |
+
size 4670584720
|
model-00028-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a52e31f73dfd028abbf3bfa7444cfc12a6fbbdadd3f3fe9070866ac3ef309a4f
|
3 |
+
size 4991448968
|
model-00029-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f715e036a265aec816b4cd59da6aa1c2b48b3c97ca7c1f2c13b865374d1f9f3
|
3 |
+
size 4955794376
|
model-00030-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b2563157a7103839327f7cf6c777239232556d559b15ac751949fa288473631
|
3 |
+
size 4670518952
|
model-00031-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3b80b6ead51494ae5fccbd331729aabc6c3968d621615544377cf2797c6a561
|
3 |
+
size 4670584728
|
model-00032-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:751279fd463a80381cc217df25d7902fc5377d85999202acfe56b5e140bc1908
|
3 |
+
size 4670584720
|
model-00033-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f7ee873f06aa2d9caceea66c47930736cad143117003178f31592fa486f8ef5
|
3 |
+
size 4991448968
|
model-00034-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98d90f0ee70a97f5e87d24be83268694619e1840b2f61ae87355b61658a8c251
|
3 |
+
size 4955794376
|
model-00035-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58c8ce057b106c074fb7234a3da9cadb158987f98997c477a4f57622020ae531
|
3 |
+
size 4670518952
|
model-00036-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4550b0c3c2d70c113eae6088821c73cb59e97c26e2441f364d12b56a6c0a8bf
|
3 |
+
size 4670584728
|
model-00037-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ded90644f6b7446e0a2edb77c4ba40492535c6c35a1ea029151debe502621ed9
|
3 |
+
size 4670584760
|
model-00038-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccb762690eba441f3dca87e7ef3256bedcb45ceafd686c7ae908dafaef55a685
|
3 |
+
size 4991449056
|
model-00039-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b8ca1f19ce114ee1ba608f18da35185766b4e8bfa742f120063132b6e0dacbe
|
3 |
+
size 4955794456
|
model-00040-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d53bfc16505c0a94cc7b11d69beb8684d0830ea639628ee45f81fa986103b040
|
3 |
+
size 4670519032
|
model-00041-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a3e5251b394bc18aad2f7dccd37b5ad20a26327fcf17c9b130f4c70a791d71e
|
3 |
+
size 4670584816
|
model-00042-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52669921944ce039b80e0c37ce9267b853b0903e80b6460941386d5366b9f2f5
|
3 |
+
size 4670584808
|
model-00043-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad14fa4064f39cfad7d70a85c257440620882f452f941c69683683655b17d842
|
3 |
+
size 4991449056
|
model-00044-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49cc063874d78aa9737263f6a9d79eb59b021268054676df9fa222caa35de35e
|
3 |
+
size 4955794456
|
model-00045-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d56bb26080b9ef93eb550efc755c9c8cb100660d288d2dba16bf6787ad65fd30
|
3 |
+
size 4670519032
|
model-00046-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40998c0dad827e3474d41666db710ba3521eeef7e3a69046fa75ee8c7e3ca5ee
|
3 |
+
size 3886275304
|
model-00047-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56b10aec9a93280980a830629be8161bacec7e0f741f7b87e5fcb3de68104edb
|
3 |
+
size 4202692736
|