Upload LlamaForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +29 -0
- generation_config.json +8 -0
- model-00001-of-00106.safetensors +3 -0
- model-00002-of-00106.safetensors +3 -0
- model-00003-of-00106.safetensors +3 -0
- model-00004-of-00106.safetensors +3 -0
- model-00005-of-00106.safetensors +3 -0
- model-00006-of-00106.safetensors +3 -0
- model-00007-of-00106.safetensors +3 -0
- model-00008-of-00106.safetensors +3 -0
- model-00009-of-00106.safetensors +3 -0
- model-00010-of-00106.safetensors +3 -0
- model-00011-of-00106.safetensors +3 -0
- model-00012-of-00106.safetensors +3 -0
- model-00013-of-00106.safetensors +3 -0
- model-00014-of-00106.safetensors +3 -0
- model-00015-of-00106.safetensors +3 -0
- model-00016-of-00106.safetensors +3 -0
- model-00017-of-00106.safetensors +3 -0
- model-00018-of-00106.safetensors +3 -0
- model-00019-of-00106.safetensors +3 -0
- model-00020-of-00106.safetensors +3 -0
- model-00021-of-00106.safetensors +3 -0
- model-00022-of-00106.safetensors +3 -0
- model-00023-of-00106.safetensors +3 -0
- model-00024-of-00106.safetensors +3 -0
- model-00025-of-00106.safetensors +3 -0
- model-00026-of-00106.safetensors +3 -0
- model-00027-of-00106.safetensors +3 -0
- model-00028-of-00106.safetensors +3 -0
- model-00029-of-00106.safetensors +3 -0
- model-00030-of-00106.safetensors +3 -0
- model-00031-of-00106.safetensors +3 -0
- model-00032-of-00106.safetensors +3 -0
- model-00033-of-00106.safetensors +3 -0
- model-00034-of-00106.safetensors +3 -0
- model-00035-of-00106.safetensors +3 -0
- model-00036-of-00106.safetensors +3 -0
- model-00037-of-00106.safetensors +3 -0
- model-00038-of-00106.safetensors +3 -0
- model-00039-of-00106.safetensors +3 -0
- model-00040-of-00106.safetensors +3 -0
- model-00041-of-00106.safetensors +3 -0
- model-00042-of-00106.safetensors +3 -0
- model-00043-of-00106.safetensors +3 -0
- model-00044-of-00106.safetensors +3 -0
- model-00045-of-00106.safetensors +3 -0
- model-00046-of-00106.safetensors +3 -0
- model-00047-of-00106.safetensors +3 -0
- model-00048-of-00106.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./merged2",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 140,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 10000.0,
|
24 |
+
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.36.2",
|
27 |
+
"use_cache": false,
|
28 |
+
"vocab_size": 32000
|
29 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.36.2",
|
7 |
+
"use_cache": false
|
8 |
+
}
|
model-00001-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b21385d70b303324eff225a6b6a8705975b805cb23ebe1fd18e75405d2846de4
|
3 |
+
size 4806739440
|
model-00002-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d2c8dcf3a734d0d7e73dae05b975197664be5229202875018d1f8ab23474aa8
|
3 |
+
size 4630578440
|
model-00003-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f000c6dd16e76bcf456cdc84853be3c6d01fa131c6d7a7399183296be28ec90f
|
3 |
+
size 4362142864
|
model-00004-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67386c6a282a1defe3f3c9636f6b165b14e81abc96665db9e4de6d68a04eab5c
|
3 |
+
size 4966188864
|
model-00005-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a96516b9e430fa970a82fa415bedae34bd2c61f45d9c20218bb8064066d44add
|
3 |
+
size 4362142864
|
model-00006-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1716a29f0aa0e9e8cce505d0f1fd06aff03e090d04ebe402d37531cd49a8f13
|
3 |
+
size 4362142864
|
model-00007-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9f305229739d3eef00d6df105adfd795cd6381307e887e20c1087fbcbbedc72
|
3 |
+
size 4966188864
|
model-00008-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02ff2b92df7629fa797a2afc729d2bdedf1fd627c2a1eeadb6dc2475c8a5a4f0
|
3 |
+
size 4362142880
|
model-00009-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d017e765d91e0e8d927504e7d75cb746a47f5fabe8c2e51d7f48af110a9220
|
3 |
+
size 4362142872
|
model-00010-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d24b98baef4e5bb8b97646113b3595e3736b09bdae48200635fb0466c93e19ae
|
3 |
+
size 4966188880
|
model-00011-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a417e07496ddc82043773c786e11e1e5d5955d542b59f9ad66d0ee7a66e3c1e0
|
3 |
+
size 4362142872
|
model-00012-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ffac5372b71c252999d3f419ee635a6b7f962d8819dfe53e66ec4c398041f8
|
3 |
+
size 4362142872
|
model-00013-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:587adef026b7eec7f0553dfbd34fff62737f6e220e729b16325262b595149530
|
3 |
+
size 4966188880
|
model-00014-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ef65978f45eb6f4bf9e9d30cc0909c327110980b183efd4594411b09bd7f210
|
3 |
+
size 4362142872
|
model-00015-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:531cbe73ae058d9a9941332853a6f35c95fcdce481328e48c333305a180cd143
|
3 |
+
size 4362142872
|
model-00016-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01272681d6bc1d76731fcf2e8bf16d21c07f16bb42072ca66b751b2bc68535e9
|
3 |
+
size 4966188880
|
model-00017-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd7f470ca0d85c1dc6421a322a6d2330632b6725d894afbd3a578992b925b92b
|
3 |
+
size 4362142872
|
model-00018-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fe3ec985cc994b0e7bba2522cfc5446789b9e79d75b3a71d911ae3eee57ffaa
|
3 |
+
size 4362142872
|
model-00019-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c6a6035d1d1d7269792fd55660b7dce6d224c4404b9bd91ed421e82c993f2b7
|
3 |
+
size 4966188880
|
model-00020-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:686c4b0c39dd3bc8244131e527c605e673ec3b6b078a17b5db1f974c87c272b1
|
3 |
+
size 4362142872
|
model-00021-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5eb6705c2f74609bcdce32d5496ef002456084ec21002335ec8e77d9c8c23a2
|
3 |
+
size 4362142872
|
model-00022-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81546d86f68d76f5c7da97fe147e88ab866d19e6b6117e58848d0f4c4a2c0233
|
3 |
+
size 4966188880
|
model-00023-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad4a72b4c8f0c58290ed8504a0745de7658fb253d7dac4a75e95834f02017402
|
3 |
+
size 4362142872
|
model-00024-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aaf9482005433fabad1b124ceb9a6a137bd38f316a99e62c9ae20d669c0c931
|
3 |
+
size 4362142872
|
model-00025-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e30ab9197d0756bcd4d54f4c8a1773c82c378afb23667c4fd2b8e5afada3d4d0
|
3 |
+
size 4966188880
|
model-00026-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8464b5b2fc1b8b85390725fd90383911833d52c158f0752d184f01dda83ef9b1
|
3 |
+
size 4362142872
|
model-00027-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fea7df14ba735e76440987ff36e8a5397c70313526f3f1783e0b3c02ea78924
|
3 |
+
size 4362142872
|
model-00028-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a7ee877f50384050ca7f3a3d4fbe36a1715b83da9aad2488733f3df68e7eda0
|
3 |
+
size 4966188880
|
model-00029-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5871178e9afaf8527020c17e5209468e9ee553a1e7d126e127440d21cb3f421
|
3 |
+
size 4362142872
|
model-00030-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c51f9452c9f6e875ebe5eb044fc69510596856a5c159509b1a5fdd56ffddd19d
|
3 |
+
size 4362142872
|
model-00031-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fb4961c9225b85f449ce345a7fc118cce8819c4d03797176c7625a5f9d6c79c
|
3 |
+
size 4966188880
|
model-00032-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:260d01c03d1db85a706f2558390dc7403548abe9f59904d59b163e3f77e05996
|
3 |
+
size 4362142872
|
model-00033-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f81a762a9068d07f1ac2312576fc1a8882dd2a5fe6844b6a48b9f646bde4372c
|
3 |
+
size 4362142872
|
model-00034-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e4a53e1fdba9bc63863e438c8954c572289cae79a3f6ca5a64d11f078fe00a2
|
3 |
+
size 4966188880
|
model-00035-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:876efa34066c377495e4b3b513dc3e085286005a0261efa730fce37e04a2d488
|
3 |
+
size 4362142872
|
model-00036-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ab07ab2baaece6d30084d8c1040226b1312ab5c381b70b395f1a8f0e1777def
|
3 |
+
size 4362142872
|
model-00037-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3aff298d6f851b89ccb2688d753b9a449bfcd5d5f61e79f8772ef357ca37f8f
|
3 |
+
size 4966188880
|
model-00038-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac263823230ba8fb163a8d45502d4d45e734fcb6a72555e3296809f3bb5e3bce
|
3 |
+
size 4362142872
|
model-00039-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab84e3cf6814bdc899fbcc897955f01baa052811b5003c8c22cae6628e3498b5
|
3 |
+
size 4362142872
|
model-00040-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f489026fb8d0470fba6d0a8aa7695fc8661110ccaa17184d3630018b19dca966
|
3 |
+
size 4966188880
|
model-00041-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b27a092e8a0c56723298b95fa508317a6e5cbfb6bd9eddbe354e1cd7028098d7
|
3 |
+
size 4362142872
|
model-00042-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25fe0d80822d46cfc74572fc3e6a42ead50a9fe0b09c3683ed3609380b53ea0b
|
3 |
+
size 4362142872
|
model-00043-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ebf4ea9a760112a30e1e2b16159b089f233e5650ace831e35a80f2290033d83
|
3 |
+
size 4966188880
|
model-00044-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca46cb25dd15fda4cfa341f25b269266a999ee1fb67096c10a566fd85c0231c1
|
3 |
+
size 4362142872
|
model-00045-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e4a89c716381ab7c7153a5223034c3099689ea51a12743e7b1484fee61888f8
|
3 |
+
size 4362142872
|
model-00046-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:798f639849bc93b4eb48cd04a3c9c0066732efdb5cc2e5b0a1917acb78ef1dda
|
3 |
+
size 4966188880
|
model-00047-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e061bcb6a47746981b84f0a5598860eb6353abdf3abd0c7918b5a8c00387be7
|
3 |
+
size 4362142872
|
model-00048-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:169e978d504244dc864841a41cc8a053c807d3f6b79e8c5f8e409395ddbbbc7e
|
3 |
+
size 4362142872
|