Upload LlamaForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +28 -0
- generation_config.json +6 -0
- model-00001-of-00106.safetensors +3 -0
- model-00002-of-00106.safetensors +3 -0
- model-00003-of-00106.safetensors +3 -0
- model-00004-of-00106.safetensors +3 -0
- model-00005-of-00106.safetensors +3 -0
- model-00006-of-00106.safetensors +3 -0
- model-00007-of-00106.safetensors +3 -0
- model-00008-of-00106.safetensors +3 -0
- model-00009-of-00106.safetensors +3 -0
- model-00010-of-00106.safetensors +3 -0
- model-00011-of-00106.safetensors +3 -0
- model-00012-of-00106.safetensors +3 -0
- model-00013-of-00106.safetensors +3 -0
- model-00014-of-00106.safetensors +3 -0
- model-00015-of-00106.safetensors +3 -0
- model-00016-of-00106.safetensors +3 -0
- model-00017-of-00106.safetensors +3 -0
- model-00018-of-00106.safetensors +3 -0
- model-00019-of-00106.safetensors +3 -0
- model-00020-of-00106.safetensors +3 -0
- model-00021-of-00106.safetensors +3 -0
- model-00022-of-00106.safetensors +3 -0
- model-00023-of-00106.safetensors +3 -0
- model-00024-of-00106.safetensors +3 -0
- model-00025-of-00106.safetensors +3 -0
- model-00026-of-00106.safetensors +3 -0
- model-00027-of-00106.safetensors +3 -0
- model-00028-of-00106.safetensors +3 -0
- model-00029-of-00106.safetensors +3 -0
- model-00030-of-00106.safetensors +3 -0
- model-00031-of-00106.safetensors +3 -0
- model-00032-of-00106.safetensors +3 -0
- model-00033-of-00106.safetensors +3 -0
- model-00034-of-00106.safetensors +3 -0
- model-00035-of-00106.safetensors +3 -0
- model-00036-of-00106.safetensors +3 -0
- model-00037-of-00106.safetensors +3 -0
- model-00038-of-00106.safetensors +3 -0
- model-00039-of-00106.safetensors +3 -0
- model-00040-of-00106.safetensors +3 -0
- model-00041-of-00106.safetensors +3 -0
- model-00042-of-00106.safetensors +3 -0
- model-00043-of-00106.safetensors +3 -0
- model-00044-of-00106.safetensors +3 -0
- model-00045-of-00106.safetensors +3 -0
- model-00046-of-00106.safetensors +3 -0
- model-00047-of-00106.safetensors +3 -0
- model-00048-of-00106.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./megameditron",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 140,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pretraining_tp": 1,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 10000.0,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "float32",
|
25 |
+
"transformers_version": "4.37.2",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 32017
|
28 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.37.2"
|
6 |
+
}
|
model-00001-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44f30dc0a92bc6574428303e23a6c0964174ee94b1e701fa42f119eddf2110c
|
3 |
+
size 4807296496
|
model-00002-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f371c9797b49a1818be31f13189b21894be17abc77eb68a6c7dacb4f8e9704b2
|
3 |
+
size 4630578440
|
model-00003-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f5f1edd281d9775b494a113540cb48d6841569c03a96cb17e253e8a8d1f1593
|
3 |
+
size 4362142864
|
model-00004-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2132e1459c61cd88cd2b4c312e1cb875bf5243465b8a4efa6b9cc3b3bfc02cec
|
3 |
+
size 4966188864
|
model-00005-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb6e2477e9b0b7132ab5cd83a99a3704a27e23ca754ae0be5df32b6ddbfcf441
|
3 |
+
size 4362142864
|
model-00006-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:275616391af8a2683efbe3869bad28bb5a7e5c64b018f1f1914112d7769903a9
|
3 |
+
size 4362142864
|
model-00007-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d57593a90e8ab7b3773462e08a2d03a20a6368e8424738f61b2bdf4f64037753
|
3 |
+
size 4966188864
|
model-00008-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01c176dd13d24cce03d915ba907fdfe32af02054f7675e130610a4a50f057dc5
|
3 |
+
size 4362142880
|
model-00009-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28db210f73f2188bab3828c467e1ba8d141109443378c3a29d1ec140cee24d9d
|
3 |
+
size 4362142872
|
model-00010-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d12869ec39c315347caa7afbca5586788d4b95f32585925ba0be7a96adaf2bd
|
3 |
+
size 4966188880
|
model-00011-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1487a550365f076689e3659b67466dbc2b322b477957f37abc6b62b2486a42c7
|
3 |
+
size 4362142872
|
model-00012-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1804d2848dc8898194ef2d25056ddffc6a86bff2c210cbeb78ffc2b2128dcd78
|
3 |
+
size 4362142872
|
model-00013-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf7f8ac8e8a0a32ecff1124bf0513e3a3b4bfd680b4c7d5a5f27c75f6aedc267
|
3 |
+
size 4966188880
|
model-00014-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ef8c4db30c35951ae16df352286cc47594d12b8cf0b4afc72989ac8bfaf2b50
|
3 |
+
size 4362142872
|
model-00015-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbf5c961404fd9b659d6fd7ed2c3fe31b745e1fb1c2dfd2627789fbaf7066271
|
3 |
+
size 4362142872
|
model-00016-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e1e018e77c90d7315f9ca5adc896d042c624d9d7cdd4545e77b119c960955a1
|
3 |
+
size 4966188880
|
model-00017-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66f17b39749a12195242e6fc76058c2ce681560c31d2b61cdf01d618440e60b8
|
3 |
+
size 4362142872
|
model-00018-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6e7727d00bd5306de377d8d697e119ea62c2a53770f6fb54baf791fcdd6457f
|
3 |
+
size 4362142872
|
model-00019-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f980f2724b5efef11aba2d3c2e21f376360e68a4f41c85a3a8f14c57b899a98
|
3 |
+
size 4966188880
|
model-00020-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6d28fe1b87f35581a393ed23a9a7960137c586363a43fe134a6f802f3e9919
|
3 |
+
size 4362142872
|
model-00021-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85371cddd82e6459d7b1cbba1237e0b414539dfe3522882179e5af0abd64ccd6
|
3 |
+
size 4362142872
|
model-00022-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:959127991902a94a91669e30363c90a67810a52e3142ce5f7a2f908964c73bf0
|
3 |
+
size 4966188880
|
model-00023-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:278ae88f1c61df761593d4a3cce286b8be4cce0e90a37e5ab3c78b016ac402a4
|
3 |
+
size 4362142872
|
model-00024-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc90c062ac66b626383f8eb13655054e6d8197771c7063cab579babd82a484c4
|
3 |
+
size 4362142872
|
model-00025-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b2235386f1e48e03ed8a8c5d920c04931419bd4b765a31a1fa05e002a03c556
|
3 |
+
size 4966188880
|
model-00026-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:569fb6ca087dc124de13c19d5f5027f4aacf1104e330ba9796307741b26925c3
|
3 |
+
size 4362142872
|
model-00027-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e50faf290f8fde5b4a4b04f78228894a4f59b91372c37160fe04d0d157b324f
|
3 |
+
size 4362142872
|
model-00028-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd5554cb2e1b2c20b57ef323d03f8503182973e5bf73687b3f6ed81f88b259e2
|
3 |
+
size 4966188880
|
model-00029-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6a712f513bed6dddd8cde9b88485c5db25ef4ee35600867d851d92e76df86c0
|
3 |
+
size 4362142872
|
model-00030-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:166c4281d86ec9683fc339a01bf537d42ef12a7b186ac14a5e0f7de798f3fdde
|
3 |
+
size 4362142872
|
model-00031-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d36da9926dd8868f30b9584b870fa068c4a174d7809f77cc5809aae56896390a
|
3 |
+
size 4966188880
|
model-00032-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70ed077b14fff9ecb57102bb6f7ea32b248b452670bf31456fde62a5886458ff
|
3 |
+
size 4362142872
|
model-00033-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01dcf19ef6fbb286fe2d868ef7b738c796982e7d3ba2163e71b26e8814a8a823
|
3 |
+
size 4362142872
|
model-00034-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1533a69d5910e3ec69df3349b8c3703703367af01fdff78b433be0df812f840
|
3 |
+
size 4966188880
|
model-00035-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae7bd608da1edf12dac3e684ad504632192543cd1f5b2b3a99c0fb291dbb241a
|
3 |
+
size 4362142872
|
model-00036-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37666359397e186f8905bdf4634ee01625b4f3e4a652b612441654164bba140d
|
3 |
+
size 4362142872
|
model-00037-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:308dc865f397c805a29813436bc87ab62182749640cba6b8f71deb5ab2ab91e7
|
3 |
+
size 4966188880
|
model-00038-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e82ecfee42184e7b57cd8a1d4e7ca676309e9d48c89aa15f2b809cc454f6972
|
3 |
+
size 4362142872
|
model-00039-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6281dede905574ce3856ad6b1d4d5d30cbd0fefe2ec4a09fb7e14f51c979a7b9
|
3 |
+
size 4362142872
|
model-00040-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11bc1ce583318a4cf9cf647386786f818ff6092fbeda1df269c11310f50917c4
|
3 |
+
size 4966188880
|
model-00041-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b3c78e972b00a18357f9e5c3fddd0045bb1dff28120581a5c278d087c346499
|
3 |
+
size 4362142872
|
model-00042-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28e71dd95cf65563c3d0be1870cf8c7d61cfda48a8b82d878046c385b3983e96
|
3 |
+
size 4362142872
|
model-00043-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6e0acbfd05b56f2b2c2196f4189c86065ff759ef47e0484527ea1c660990b9e
|
3 |
+
size 4966188880
|
model-00044-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d3e45974ce0bc071c085268af0a2b9e00745b53f7b7cebaed7e09a10f095ac6
|
3 |
+
size 4362142872
|
model-00045-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18a3021cf61db1e8aa5910886a52b7faae9b2563511778369bda21f63412ceff
|
3 |
+
size 4362142872
|
model-00046-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eef6c91dc333e5afd238bd0cb6f1bf3b75c4daab1dd5d3a6febc03b51b0f653
|
3 |
+
size 4966188880
|
model-00047-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:098845e4ee41cc8deb0f3ece1770c4a18dd7296dfde2e8deef668eb72853ba8e
|
3 |
+
size 4362142872
|
model-00048-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecafa9aa5a28f2b0f681c84025326c4ca6a11eb67a141fec86fc90665f843779
|
3 |
+
size 4362142872
|