Radostin Cholakov
committed on
Commit
•
3a58b22
1
Parent(s):
de1b5cd
Add nf_w4g64.
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +35 -0
- flute_config.json +5 -0
- generation_config.json +9 -0
- model-00001-of-00047.safetensors +3 -0
- model-00002-of-00047.safetensors +3 -0
- model-00003-of-00047.safetensors +3 -0
- model-00004-of-00047.safetensors +3 -0
- model-00005-of-00047.safetensors +3 -0
- model-00006-of-00047.safetensors +3 -0
- model-00007-of-00047.safetensors +3 -0
- model-00008-of-00047.safetensors +3 -0
- model-00009-of-00047.safetensors +3 -0
- model-00010-of-00047.safetensors +3 -0
- model-00011-of-00047.safetensors +3 -0
- model-00012-of-00047.safetensors +3 -0
- model-00013-of-00047.safetensors +3 -0
- model-00014-of-00047.safetensors +3 -0
- model-00015-of-00047.safetensors +3 -0
- model-00016-of-00047.safetensors +3 -0
- model-00017-of-00047.safetensors +3 -0
- model-00018-of-00047.safetensors +3 -0
- model-00019-of-00047.safetensors +3 -0
- model-00020-of-00047.safetensors +3 -0
- model-00021-of-00047.safetensors +3 -0
- model-00022-of-00047.safetensors +3 -0
- model-00023-of-00047.safetensors +3 -0
- model-00024-of-00047.safetensors +3 -0
- model-00025-of-00047.safetensors +3 -0
- model-00026-of-00047.safetensors +3 -0
- model-00027-of-00047.safetensors +3 -0
- model-00028-of-00047.safetensors +3 -0
- model-00029-of-00047.safetensors +3 -0
- model-00030-of-00047.safetensors +3 -0
- model-00031-of-00047.safetensors +3 -0
- model-00032-of-00047.safetensors +3 -0
- model-00033-of-00047.safetensors +3 -0
- model-00034-of-00047.safetensors +3 -0
- model-00035-of-00047.safetensors +3 -0
- model-00036-of-00047.safetensors +3 -0
- model-00037-of-00047.safetensors +3 -0
- model-00038-of-00047.safetensors +3 -0
- model-00039-of-00047.safetensors +3 -0
- model-00040-of-00047.safetensors +3 -0
- model-00041-of-00047.safetensors +3 -0
- model-00042-of-00047.safetensors +3 -0
- model-00043-of-00047.safetensors +3 -0
- model-00044-of-00047.safetensors +3 -0
- model-00045-of-00047.safetensors +3 -0
- model-00046-of-00047.safetensors +3 -0
- model-00047-of-00047.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/data/cl/scratch/model_weights/Meta-Llama-3.1-405B",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 16384,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 53248,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 128,
|
18 |
+
"num_hidden_layers": 126,
|
19 |
+
"num_key_value_heads": 16,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": {
|
23 |
+
"factor": 8.0,
|
24 |
+
"high_freq_factor": 4.0,
|
25 |
+
"low_freq_factor": 1.0,
|
26 |
+
"original_max_position_embeddings": 8192,
|
27 |
+
"rope_type": "llama3"
|
28 |
+
},
|
29 |
+
"rope_theta": 500000.0,
|
30 |
+
"tie_word_embeddings": false,
|
31 |
+
"torch_dtype": "float16",
|
32 |
+
"transformers_version": "4.44.2",
|
33 |
+
"use_cache": true,
|
34 |
+
"vocab_size": 128256
|
35 |
+
}
|
flute_config.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"num_sms": 108,
|
3 |
+
"num_bits": 4,
|
4 |
+
"group_size": 64
|
5 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128001,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.9,
|
8 |
+
"transformers_version": "4.44.2"
|
9 |
+
}
|
model-00001-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b90b4cfa9b9116b1fbe023029af06bd738e9401c5a2b9cd4c775397a5aebf5e
|
3 |
+
size 4987035088
|
model-00002-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f96765f8d8ab16d27d343b7aefb9cbf5a8ac184ecdbc509a5ab3e91da27393c
|
3 |
+
size 4670584640
|
model-00003-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e941fedd54acc9f540817c4d35f17dfae43461bb14b1cea39074311fb3a89b3b
|
3 |
+
size 4991448880
|
model-00004-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f046379ba85059e806e081a2eb4d0f2cdb6fad0540fd1a4883949f7dcfb8108
|
3 |
+
size 4955794296
|
model-00005-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e678f4d8a209cb2e887183bd5412763cf190ed4b10a70f7f323c199b70e68242
|
3 |
+
size 4670518920
|
model-00006-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4689f4ecf28146fa3d84bc269029ca06cd1e4f665f09e05921c24005324b0be6
|
3 |
+
size 4670584728
|
model-00007-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abd4a6aff57a7e2bb4321fbe0ea164dd0efbd442ae6608bd2256a30f3382df8e
|
3 |
+
size 4670584720
|
model-00008-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d7be621c1976feae0b190eedcb2eb761f74be101ef50095e481e67091a43c9b
|
3 |
+
size 4991448968
|
model-00009-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a587e433c67127e4c96351eb91fe5d4cd5702e5fa106bbefbea1c59fde4f31c
|
3 |
+
size 4955794376
|
model-00010-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e85d4006b57a8caa05f77088d7f94dbd79b90b66de57b980529064fefb8c6a0
|
3 |
+
size 4670518952
|
model-00011-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f605a88d00bb076931e31031f94fe7c966b753135f5747aa70010d975e8ccec6
|
3 |
+
size 4670584728
|
model-00012-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:083f8825c875685b066e9e1940559b7c24b288698b43c806d3a9f8e1030a27c6
|
3 |
+
size 4670584720
|
model-00013-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0205707407cf8739010b981aa5f5c76e7ec67c48fa01f81da12ee168ae2bc98e
|
3 |
+
size 4991448968
|
model-00014-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:952e3cf60c47820b4575981968ddbe3f31b9a098c3501f6e259b57660d8580e5
|
3 |
+
size 4955794376
|
model-00015-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e6aa748eccf100a69f2355ce419f11fec54c2b0fd86031dc065343e454277a2
|
3 |
+
size 4670518952
|
model-00016-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2050eb9670e7bc5319e7891ffa3ed92534ce15f30463b639a7dec85623a7c363
|
3 |
+
size 4670584728
|
model-00017-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcc0afa0bf1181b9579452093715260a89eb3962c969b6531d0db07b1d084ab9
|
3 |
+
size 4670584720
|
model-00018-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:280da8fa37ee398e759aab905bb0e3b8195660b2c6e8733075c994f15589275d
|
3 |
+
size 4991448968
|
model-00019-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f5b6e9cf64e296f97715b66fa4999b4674502d681f802baaacce6438c0b5268
|
3 |
+
size 4955794376
|
model-00020-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b20a61f0c7b6cbd165c215835dac1a1dccf0f02fa737ca4f2e714c1990be47e
|
3 |
+
size 4670518952
|
model-00021-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c31041007161db86edf9a402561b04349b00a9d933d589a1343cbbb2874c61f5
|
3 |
+
size 4670584728
|
model-00022-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:440c9d766631ce86f6016ebf33f624178829e733057b3db1132cc690215a3dcb
|
3 |
+
size 4670584720
|
model-00023-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1128429c5b290edf8e6816727d6f74e1acc107d67286cf919ee027f5fe3be591
|
3 |
+
size 4991448968
|
model-00024-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be9e690b7ec42043ca301dc3204d7462cfd72a479ecc7a378ddbcd72a78dd11
|
3 |
+
size 4955794376
|
model-00025-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3aecd1128f4bd25e0859f28bd9459f2c25f1821ef82a3091a8d67e264e463e
|
3 |
+
size 4670518952
|
model-00026-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5b02524e98d62050d021236fe9c3e347a48fb8416450832287fb777ac725d40
|
3 |
+
size 4670584728
|
model-00027-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34c8649fbfc2478cce3c909ecfe4ba524fbaa3df8e3609d7fab32f974e0a2ae7
|
3 |
+
size 4670584720
|
model-00028-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:635ce4ce984d4b5b0eae8c090384631b7798dbe486cef9d5bc9ce88ffacbed81
|
3 |
+
size 4991448968
|
model-00029-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c17a517546d32c618a7fe0d9e3ad9cf7aa1c77f557cbb899cafaa8f9e379f4d
|
3 |
+
size 4955794376
|
model-00030-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ef22dac6503a20042c0444706c9712cbcc20eb57d196f01c473b8ec90ccdb93
|
3 |
+
size 4670518952
|
model-00031-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c14c665902194578b36297b35cc1c8a0879f3240d0ec4fa1a5ae2ee101df60b8
|
3 |
+
size 4670584728
|
model-00032-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1619a1e4939385fcfa3bfc93b05ea99b6deeac1b6840266a584e613da05a179f
|
3 |
+
size 4670584720
|
model-00033-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd84216aef85ad1931d70f71ea7a4d2872eebcb4a3ea0619b82b2af80d3cf031
|
3 |
+
size 4991448968
|
model-00034-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a1e2c341e68f75ab492fb3b838b01cea0c0d7a3a326863f61f7da2b0cfb5556
|
3 |
+
size 4955794376
|
model-00035-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba0f8932484a0cb740ee47e909b7734abbec5a0dc7a0f6b4b72b2da28eef8a0a
|
3 |
+
size 4670518952
|
model-00036-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f35059acb555cbb0ac330e3cbc33e10656bad2850539a4f20a3916f606cb6592
|
3 |
+
size 4670584728
|
model-00037-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:786f4d544d97c7b58629fc4c3e9c0857c91cb6b7c9e03aad025f12ca45412486
|
3 |
+
size 4670584760
|
model-00038-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e67a9e1e2d17822ca03333f13614814e4f3eb9abf4cb29cc9fccddeb5bd82c98
|
3 |
+
size 4991449056
|
model-00039-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d365794eb11fc2f13bff7a08f710851b3c0c6f03399926996a5259b883bf08cb
|
3 |
+
size 4955794456
|
model-00040-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08f17873cb919a5bd70446cd00870077852a35f0d84d1afd7913240d84c4cc92
|
3 |
+
size 4670519032
|
model-00041-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15ea41b8f9a8a2f6f53107ee8fdd9de6b983035f8a738b4e0000b3130c8b9020
|
3 |
+
size 4670584816
|
model-00042-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb88bfba7e2af768361242f0cb46bf8a3f8243c0d01593e3f5fbffe034fba4f5
|
3 |
+
size 4670584808
|
model-00043-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78c3759e9589615dee40e5b8bcc2b87abe671445a4e6cf924eefe1f4aeedb4c5
|
3 |
+
size 4991449056
|
model-00044-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0defe1790900441fe2f5761bc0052e32f15d4994aee0e4643c4548ebd3f75b2
|
3 |
+
size 4955794456
|
model-00045-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:870e8926d4f1e413604117b11be72a11bcaf07e6a6a03c924d77bd679535833d
|
3 |
+
size 4670519032
|
model-00046-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44944b15fe4a6ba9e9a1da09b527521c4ad906cabdf2d740226ac0746c83919c
|
3 |
+
size 3886275304
|
model-00047-of-00047.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ad9f1b9d860e193110b25ae81706a93a93991adcd9e8b2333d3273235e6cee5
|
3 |
+
size 4202692736
|