Safetensors
llama
lastdefiance20 committed on
Commit
59a6ae7
·
verified ·
1 Parent(s): 2f34f0b

Upload LlamaForCausalLM

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +40 -0
  2. generation_config.json +12 -0
  3. model-00001-of-00062.safetensors +3 -0
  4. model-00002-of-00062.safetensors +3 -0
  5. model-00003-of-00062.safetensors +3 -0
  6. model-00004-of-00062.safetensors +3 -0
  7. model-00005-of-00062.safetensors +3 -0
  8. model-00006-of-00062.safetensors +3 -0
  9. model-00007-of-00062.safetensors +3 -0
  10. model-00008-of-00062.safetensors +3 -0
  11. model-00009-of-00062.safetensors +3 -0
  12. model-00010-of-00062.safetensors +3 -0
  13. model-00011-of-00062.safetensors +3 -0
  14. model-00012-of-00062.safetensors +3 -0
  15. model-00013-of-00062.safetensors +3 -0
  16. model-00014-of-00062.safetensors +3 -0
  17. model-00015-of-00062.safetensors +3 -0
  18. model-00016-of-00062.safetensors +3 -0
  19. model-00017-of-00062.safetensors +3 -0
  20. model-00018-of-00062.safetensors +3 -0
  21. model-00019-of-00062.safetensors +3 -0
  22. model-00020-of-00062.safetensors +3 -0
  23. model-00021-of-00062.safetensors +3 -0
  24. model-00022-of-00062.safetensors +3 -0
  25. model-00023-of-00062.safetensors +3 -0
  26. model-00024-of-00062.safetensors +3 -0
  27. model-00025-of-00062.safetensors +3 -0
  28. model-00026-of-00062.safetensors +3 -0
  29. model-00027-of-00062.safetensors +3 -0
  30. model-00028-of-00062.safetensors +3 -0
  31. model-00029-of-00062.safetensors +3 -0
  32. model-00030-of-00062.safetensors +3 -0
  33. model-00031-of-00062.safetensors +3 -0
  34. model-00032-of-00062.safetensors +3 -0
  35. model-00033-of-00062.safetensors +3 -0
  36. model-00034-of-00062.safetensors +3 -0
  37. model-00035-of-00062.safetensors +3 -0
  38. model-00036-of-00062.safetensors +3 -0
  39. model-00037-of-00062.safetensors +3 -0
  40. model-00038-of-00062.safetensors +3 -0
  41. model-00039-of-00062.safetensors +3 -0
  42. model-00040-of-00062.safetensors +3 -0
  43. model-00041-of-00062.safetensors +3 -0
  44. model-00042-of-00062.safetensors +3 -0
  45. model-00043-of-00062.safetensors +3 -0
  46. model-00044-of-00062.safetensors +3 -0
  47. model-00045-of-00062.safetensors +3 -0
  48. model-00046-of-00062.safetensors +3 -0
  49. model-00047-of-00062.safetensors +3 -0
  50. model-00048-of-00062.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/raid/checkpoint/averitec/Meta-Llama-3.1-70B-HerO-bs/checkpoint-48",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 8192,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 28672,
19
+ "max_position_embeddings": 131072,
20
+ "mlp_bias": false,
21
+ "model_type": "llama",
22
+ "num_attention_heads": 64,
23
+ "num_hidden_layers": 80,
24
+ "num_key_value_heads": 8,
25
+ "pretraining_tp": 1,
26
+ "rms_norm_eps": 1e-05,
27
+ "rope_scaling": {
28
+ "factor": 8.0,
29
+ "high_freq_factor": 4.0,
30
+ "low_freq_factor": 1.0,
31
+ "original_max_position_embeddings": 8192,
32
+ "rope_type": "llama3"
33
+ },
34
+ "rope_theta": 500000.0,
35
+ "tie_word_embeddings": false,
36
+ "torch_dtype": "float32",
37
+ "transformers_version": "4.46.1",
38
+ "use_cache": false,
39
+ "vocab_size": 128256
40
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.46.1"
12
+ }
model-00001-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b4c66ef691095de5bef4270fe0613a4392c3dcae5190a82664c64772472adeb
3
+ size 4806672984
model-00002-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e569256fe933a4d160c2231e251278ca0cea04ece1e21544a7f71f333db0c48a
3
+ size 4362142864
model-00003-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d8746592cbcb1d66f65490349cb9c21131fab3ce6aa20576723b1f25bbf3c7b
3
+ size 4362142864
model-00004-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef3a52c53bc55852195e964b2716b196ac789c99ad8fcf82b627690fb49494cf
3
+ size 4966188864
model-00005-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0e80da994ea0de80729d420c6332a833b2d107ec92d0b26af0b206ae2694e9
3
+ size 4362142864
model-00006-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1afec345058951a18cd4b5ddc0654b1a5436bc572b046f056c795b62786300d
3
+ size 4362142864
model-00007-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14b9e367fa75d6f0746f23a853495b2a67429ecea58251463821b193e7acbae7
3
+ size 4966188864
model-00008-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91e996843e886ff412b9248027120b6443e13f56cabaa3ca550b201aeaa729b6
3
+ size 4362142864
model-00009-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d77ff0be94849eac75e03b0d3f23800326538102e16feefc3d3e40b3ae51a098
3
+ size 4362142880
model-00010-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98b9cc9c68ca9ee19242bd02bafda8c6c612cc6fd80d64114dfff121cc1db522
3
+ size 4966188880
model-00011-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31c5766fb851b089719db14f1917627f125cd5d3287d1c2f138492ebc62342a0
3
+ size 4362142872
model-00012-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96329b0ccd35c4b8d16d8791d062e3f58ab5239cd49c85ad92aa7fe1baf120a5
3
+ size 4362142872
model-00013-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0307bf0cb015cc3de8c657377e4f7d27344367053a6d3435a65179f9c776405
3
+ size 4966188880
model-00014-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c95bc1f9cd3fffe0514d1ecc23621b0c041ac678b5aef363dae52fdffd562fd
3
+ size 4362142872
model-00015-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b8b09ec6f0a23f12f9a0ae0c6eb54162861d92ea89fdf5fa1d2a0ca0aee4477
3
+ size 4362142872
model-00016-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4acc5969aad7303e894067f49053fc5f578624296dc040412a711bb04876d3b
3
+ size 4966188880
model-00017-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bee1e379b2d73e6270339d30dcc815bd2295be4ddce6d539d4ba6d0659fa11c
3
+ size 4362142872
model-00018-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ad7880cae914b6841ab8e33b457eb320b2c62d70d0f0acc29a747b43f458cb2
3
+ size 4362142872
model-00019-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26d6f20772c2c2e268578de8158d19799fc4c22ea5610db16a95c78fc9339aa0
3
+ size 4966188880
model-00020-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c9159399cc077ab88b91b945c59a0d9c911e90d4aa386b1220260e5b4ce1d77
3
+ size 4362142872
model-00021-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88f19d18fe2f0979d6fe939841515af3521ef771b43aed86dddc15bedbdd2f36
3
+ size 4362142872
model-00022-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b64dc3d0a633233b7d022c6c7f1354617fb0d4b24fb78887d33992667f69698
3
+ size 4966188880
model-00023-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cb20619df9745a0c07621864e01da225075959b282503f580df4d2425831c19
3
+ size 4362142872
model-00024-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a953f7d8d03e5215ba16443af633dce083037a549debc712596c8eda7bd16870
3
+ size 4362142872
model-00025-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d4ef31c663a3dc48d159a976970ca735615783f49d0493f581810fedb1a8b50
3
+ size 4966188880
model-00026-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c727f018923d6a01d94d1bf242d88c0eef9fbcf8e3df78f11b50275e80eb5482
3
+ size 4362142872
model-00027-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74cf981d1ba8abfea4f48e4e65c12f34ca4dfdea64d7821453b4aa658899e9a8
3
+ size 4362142872
model-00028-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a359024ee1ca5216ae1d5ca631e3d6eb67265714f9b55e178481728b45c05578
3
+ size 4966188880
model-00029-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858b382360c0c57dfc17abb20d28a61e1fc0f0b34d5290383e69631c7972608c
3
+ size 4362142872
model-00030-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ef09d30a66af96538dc6f382129c1b297278d5baa6bb5491f926c5693274f8
3
+ size 4362142872
model-00031-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0b91e5dea235b57dfd6369137722e4a0876c6d24f4ac7177eb88c6ec1139de7
3
+ size 4966188880
model-00032-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd58845afd6b69d11744417067e73298c688a328aebf0d426ed10d997f184d3c
3
+ size 4362142872
model-00033-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dae2c007bcfac81441743007065e00566d7256afa3602e0c39cda361bdd97a4
3
+ size 4362142872
model-00034-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:790f5278f1e40c06876c14aec668a5fd6a24dcf8321e3b3413b992be7fffcf7e
3
+ size 4966188880
model-00035-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02cafabad8f09dc315c9f72baba6ed4ba92cc5127c1b14e437d4e7a61bdc54b1
3
+ size 4362142872
model-00036-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1742e8969ef49e8a9aa5490fbaaf868ab6b6874c9625d71074632239d04a51d1
3
+ size 4362142872
model-00037-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a11ce33e0ba0e2d3021d4ed63923c27f4f256c74a6a4effe0eb9102a3c1d5381
3
+ size 4966188880
model-00038-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c3153e7d6114ec71c63f99bbf33498157600b8b2ffbd3c442d2f14e37bf0f9f
3
+ size 4362142872
model-00039-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf9fce44374b00e8cd99cfc888c92768a8d210cc054de9ca8f79a49ae725b9fb
3
+ size 4362142872
model-00040-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e65bdfb179c50adaad93e5a87855f94aad3f776f08e95ffcfe6a9d50819cf4b
3
+ size 4966188880
model-00041-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93cb604d3fe041f0ff181d828194498433f4a2b0518245f955f4c5666c046543
3
+ size 4362142872
model-00042-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a50e11b046e2da47e7a8575ff1b854b26cc4ee9d364483c4f231c2c9a550d93
3
+ size 4362142872
model-00043-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b376bf6b14b0096ff3c105f1e8bc4cf01e2186f494cfc3c87f7e2720b077cf3
3
+ size 4966188880
model-00044-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c2ca635b14164e6225e9d6d6db299f6d886149ae71a3251a72d4243fe8f2227
3
+ size 4362142872
model-00045-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e5300658a6c4865ad570027e4f80108173630afe8232db45d2866b06894d2b5
3
+ size 4362142872
model-00046-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64106f49bd3abd1f9ec11f7290004cf80c4522a0e704481f00a2b5ac7e32f28e
3
+ size 4966188880
model-00047-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de4c06d5a4cd137ebaaf890e9c4f7feffbd0523d960fa1c0b023dc2fcf464a7c
3
+ size 4362142872
model-00048-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:285a83e448f134e1441d75c7b7eba25ff488be12a782b68850ba4b8e4b45b3a9
3
+ size 4362142872