lastdefiance20
committed on
Upload LlamaForCausalLM
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +40 -0
- generation_config.json +12 -0
- model-00001-of-00062.safetensors +3 -0
- model-00002-of-00062.safetensors +3 -0
- model-00003-of-00062.safetensors +3 -0
- model-00004-of-00062.safetensors +3 -0
- model-00005-of-00062.safetensors +3 -0
- model-00006-of-00062.safetensors +3 -0
- model-00007-of-00062.safetensors +3 -0
- model-00008-of-00062.safetensors +3 -0
- model-00009-of-00062.safetensors +3 -0
- model-00010-of-00062.safetensors +3 -0
- model-00011-of-00062.safetensors +3 -0
- model-00012-of-00062.safetensors +3 -0
- model-00013-of-00062.safetensors +3 -0
- model-00014-of-00062.safetensors +3 -0
- model-00015-of-00062.safetensors +3 -0
- model-00016-of-00062.safetensors +3 -0
- model-00017-of-00062.safetensors +3 -0
- model-00018-of-00062.safetensors +3 -0
- model-00019-of-00062.safetensors +3 -0
- model-00020-of-00062.safetensors +3 -0
- model-00021-of-00062.safetensors +3 -0
- model-00022-of-00062.safetensors +3 -0
- model-00023-of-00062.safetensors +3 -0
- model-00024-of-00062.safetensors +3 -0
- model-00025-of-00062.safetensors +3 -0
- model-00026-of-00062.safetensors +3 -0
- model-00027-of-00062.safetensors +3 -0
- model-00028-of-00062.safetensors +3 -0
- model-00029-of-00062.safetensors +3 -0
- model-00030-of-00062.safetensors +3 -0
- model-00031-of-00062.safetensors +3 -0
- model-00032-of-00062.safetensors +3 -0
- model-00033-of-00062.safetensors +3 -0
- model-00034-of-00062.safetensors +3 -0
- model-00035-of-00062.safetensors +3 -0
- model-00036-of-00062.safetensors +3 -0
- model-00037-of-00062.safetensors +3 -0
- model-00038-of-00062.safetensors +3 -0
- model-00039-of-00062.safetensors +3 -0
- model-00040-of-00062.safetensors +3 -0
- model-00041-of-00062.safetensors +3 -0
- model-00042-of-00062.safetensors +3 -0
- model-00043-of-00062.safetensors +3 -0
- model-00044-of-00062.safetensors +3 -0
- model-00045-of-00062.safetensors +3 -0
- model-00046-of-00062.safetensors +3 -0
- model-00047-of-00062.safetensors +3 -0
- model-00048-of-00062.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/raid/checkpoint/averitec/Meta-Llama-3.1-70B-HerO-bs/checkpoint-48",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 8192,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 28672,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 64,
|
23 |
+
"num_hidden_layers": 80,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"rms_norm_eps": 1e-05,
|
27 |
+
"rope_scaling": {
|
28 |
+
"factor": 8.0,
|
29 |
+
"high_freq_factor": 4.0,
|
30 |
+
"low_freq_factor": 1.0,
|
31 |
+
"original_max_position_embeddings": 8192,
|
32 |
+
"rope_type": "llama3"
|
33 |
+
},
|
34 |
+
"rope_theta": 500000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.46.1",
|
38 |
+
"use_cache": false,
|
39 |
+
"vocab_size": 128256
|
40 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.46.1"
|
12 |
+
}
|
model-00001-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b4c66ef691095de5bef4270fe0613a4392c3dcae5190a82664c64772472adeb
|
3 |
+
size 4806672984
|
model-00002-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e569256fe933a4d160c2231e251278ca0cea04ece1e21544a7f71f333db0c48a
|
3 |
+
size 4362142864
|
model-00003-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d8746592cbcb1d66f65490349cb9c21131fab3ce6aa20576723b1f25bbf3c7b
|
3 |
+
size 4362142864
|
model-00004-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef3a52c53bc55852195e964b2716b196ac789c99ad8fcf82b627690fb49494cf
|
3 |
+
size 4966188864
|
model-00005-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be0e80da994ea0de80729d420c6332a833b2d107ec92d0b26af0b206ae2694e9
|
3 |
+
size 4362142864
|
model-00006-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1afec345058951a18cd4b5ddc0654b1a5436bc572b046f056c795b62786300d
|
3 |
+
size 4362142864
|
model-00007-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14b9e367fa75d6f0746f23a853495b2a67429ecea58251463821b193e7acbae7
|
3 |
+
size 4966188864
|
model-00008-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91e996843e886ff412b9248027120b6443e13f56cabaa3ca550b201aeaa729b6
|
3 |
+
size 4362142864
|
model-00009-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d77ff0be94849eac75e03b0d3f23800326538102e16feefc3d3e40b3ae51a098
|
3 |
+
size 4362142880
|
model-00010-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98b9cc9c68ca9ee19242bd02bafda8c6c612cc6fd80d64114dfff121cc1db522
|
3 |
+
size 4966188880
|
model-00011-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31c5766fb851b089719db14f1917627f125cd5d3287d1c2f138492ebc62342a0
|
3 |
+
size 4362142872
|
model-00012-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96329b0ccd35c4b8d16d8791d062e3f58ab5239cd49c85ad92aa7fe1baf120a5
|
3 |
+
size 4362142872
|
model-00013-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0307bf0cb015cc3de8c657377e4f7d27344367053a6d3435a65179f9c776405
|
3 |
+
size 4966188880
|
model-00014-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c95bc1f9cd3fffe0514d1ecc23621b0c041ac678b5aef363dae52fdffd562fd
|
3 |
+
size 4362142872
|
model-00015-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b8b09ec6f0a23f12f9a0ae0c6eb54162861d92ea89fdf5fa1d2a0ca0aee4477
|
3 |
+
size 4362142872
|
model-00016-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4acc5969aad7303e894067f49053fc5f578624296dc040412a711bb04876d3b
|
3 |
+
size 4966188880
|
model-00017-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bee1e379b2d73e6270339d30dcc815bd2295be4ddce6d539d4ba6d0659fa11c
|
3 |
+
size 4362142872
|
model-00018-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ad7880cae914b6841ab8e33b457eb320b2c62d70d0f0acc29a747b43f458cb2
|
3 |
+
size 4362142872
|
model-00019-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26d6f20772c2c2e268578de8158d19799fc4c22ea5610db16a95c78fc9339aa0
|
3 |
+
size 4966188880
|
model-00020-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c9159399cc077ab88b91b945c59a0d9c911e90d4aa386b1220260e5b4ce1d77
|
3 |
+
size 4362142872
|
model-00021-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88f19d18fe2f0979d6fe939841515af3521ef771b43aed86dddc15bedbdd2f36
|
3 |
+
size 4362142872
|
model-00022-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b64dc3d0a633233b7d022c6c7f1354617fb0d4b24fb78887d33992667f69698
|
3 |
+
size 4966188880
|
model-00023-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cb20619df9745a0c07621864e01da225075959b282503f580df4d2425831c19
|
3 |
+
size 4362142872
|
model-00024-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a953f7d8d03e5215ba16443af633dce083037a549debc712596c8eda7bd16870
|
3 |
+
size 4362142872
|
model-00025-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d4ef31c663a3dc48d159a976970ca735615783f49d0493f581810fedb1a8b50
|
3 |
+
size 4966188880
|
model-00026-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c727f018923d6a01d94d1bf242d88c0eef9fbcf8e3df78f11b50275e80eb5482
|
3 |
+
size 4362142872
|
model-00027-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74cf981d1ba8abfea4f48e4e65c12f34ca4dfdea64d7821453b4aa658899e9a8
|
3 |
+
size 4362142872
|
model-00028-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a359024ee1ca5216ae1d5ca631e3d6eb67265714f9b55e178481728b45c05578
|
3 |
+
size 4966188880
|
model-00029-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:858b382360c0c57dfc17abb20d28a61e1fc0f0b34d5290383e69631c7972608c
|
3 |
+
size 4362142872
|
model-00030-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8ef09d30a66af96538dc6f382129c1b297278d5baa6bb5491f926c5693274f8
|
3 |
+
size 4362142872
|
model-00031-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0b91e5dea235b57dfd6369137722e4a0876c6d24f4ac7177eb88c6ec1139de7
|
3 |
+
size 4966188880
|
model-00032-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd58845afd6b69d11744417067e73298c688a328aebf0d426ed10d997f184d3c
|
3 |
+
size 4362142872
|
model-00033-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dae2c007bcfac81441743007065e00566d7256afa3602e0c39cda361bdd97a4
|
3 |
+
size 4362142872
|
model-00034-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:790f5278f1e40c06876c14aec668a5fd6a24dcf8321e3b3413b992be7fffcf7e
|
3 |
+
size 4966188880
|
model-00035-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02cafabad8f09dc315c9f72baba6ed4ba92cc5127c1b14e437d4e7a61bdc54b1
|
3 |
+
size 4362142872
|
model-00036-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1742e8969ef49e8a9aa5490fbaaf868ab6b6874c9625d71074632239d04a51d1
|
3 |
+
size 4362142872
|
model-00037-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a11ce33e0ba0e2d3021d4ed63923c27f4f256c74a6a4effe0eb9102a3c1d5381
|
3 |
+
size 4966188880
|
model-00038-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3153e7d6114ec71c63f99bbf33498157600b8b2ffbd3c442d2f14e37bf0f9f
|
3 |
+
size 4362142872
|
model-00039-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf9fce44374b00e8cd99cfc888c92768a8d210cc054de9ca8f79a49ae725b9fb
|
3 |
+
size 4362142872
|
model-00040-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e65bdfb179c50adaad93e5a87855f94aad3f776f08e95ffcfe6a9d50819cf4b
|
3 |
+
size 4966188880
|
model-00041-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93cb604d3fe041f0ff181d828194498433f4a2b0518245f955f4c5666c046543
|
3 |
+
size 4362142872
|
model-00042-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a50e11b046e2da47e7a8575ff1b854b26cc4ee9d364483c4f231c2c9a550d93
|
3 |
+
size 4362142872
|
model-00043-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b376bf6b14b0096ff3c105f1e8bc4cf01e2186f494cfc3c87f7e2720b077cf3
|
3 |
+
size 4966188880
|
model-00044-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c2ca635b14164e6225e9d6d6db299f6d886149ae71a3251a72d4243fe8f2227
|
3 |
+
size 4362142872
|
model-00045-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e5300658a6c4865ad570027e4f80108173630afe8232db45d2866b06894d2b5
|
3 |
+
size 4362142872
|
model-00046-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64106f49bd3abd1f9ec11f7290004cf80c4522a0e704481f00a2b5ac7e32f28e
|
3 |
+
size 4966188880
|
model-00047-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de4c06d5a4cd137ebaaf890e9c4f7feffbd0523d960fa1c0b023dc2fcf464a7c
|
3 |
+
size 4362142872
|
model-00048-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:285a83e448f134e1441d75c7b7eba25ff488be12a782b68850ba4b8e4b45b3a9
|
3 |
+
size 4362142872
|