ibivibiv committed on
Commit
f51e11b
1 Parent(s): 2ef05a6

Upload LlamaForCausalLM

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +28 -0
  2. generation_config.json +6 -0
  3. model-00001-of-00106.safetensors +3 -0
  4. model-00002-of-00106.safetensors +3 -0
  5. model-00003-of-00106.safetensors +3 -0
  6. model-00004-of-00106.safetensors +3 -0
  7. model-00005-of-00106.safetensors +3 -0
  8. model-00006-of-00106.safetensors +3 -0
  9. model-00007-of-00106.safetensors +3 -0
  10. model-00008-of-00106.safetensors +3 -0
  11. model-00009-of-00106.safetensors +3 -0
  12. model-00010-of-00106.safetensors +3 -0
  13. model-00011-of-00106.safetensors +3 -0
  14. model-00012-of-00106.safetensors +3 -0
  15. model-00013-of-00106.safetensors +3 -0
  16. model-00014-of-00106.safetensors +3 -0
  17. model-00015-of-00106.safetensors +3 -0
  18. model-00016-of-00106.safetensors +3 -0
  19. model-00017-of-00106.safetensors +3 -0
  20. model-00018-of-00106.safetensors +3 -0
  21. model-00019-of-00106.safetensors +3 -0
  22. model-00020-of-00106.safetensors +3 -0
  23. model-00021-of-00106.safetensors +3 -0
  24. model-00022-of-00106.safetensors +3 -0
  25. model-00023-of-00106.safetensors +3 -0
  26. model-00024-of-00106.safetensors +3 -0
  27. model-00025-of-00106.safetensors +3 -0
  28. model-00026-of-00106.safetensors +3 -0
  29. model-00027-of-00106.safetensors +3 -0
  30. model-00028-of-00106.safetensors +3 -0
  31. model-00029-of-00106.safetensors +3 -0
  32. model-00030-of-00106.safetensors +3 -0
  33. model-00031-of-00106.safetensors +3 -0
  34. model-00032-of-00106.safetensors +3 -0
  35. model-00033-of-00106.safetensors +3 -0
  36. model-00034-of-00106.safetensors +3 -0
  37. model-00035-of-00106.safetensors +3 -0
  38. model-00036-of-00106.safetensors +3 -0
  39. model-00037-of-00106.safetensors +3 -0
  40. model-00038-of-00106.safetensors +3 -0
  41. model-00039-of-00106.safetensors +3 -0
  42. model-00040-of-00106.safetensors +3 -0
  43. model-00041-of-00106.safetensors +3 -0
  44. model-00042-of-00106.safetensors +3 -0
  45. model-00043-of-00106.safetensors +3 -0
  46. model-00044-of-00106.safetensors +3 -0
  47. model-00045-of-00106.safetensors +3 -0
  48. model-00046-of-00106.safetensors +3 -0
  49. model-00047-of-00106.safetensors +3 -0
  50. model-00048-of-00106.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "./megameditron",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 28672,
14
+ "max_position_embeddings": 4096,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 140,
18
+ "num_key_value_heads": 8,
19
+ "pretraining_tp": 1,
20
+ "rms_norm_eps": 1e-05,
21
+ "rope_scaling": null,
22
+ "rope_theta": 10000.0,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "float32",
25
+ "transformers_version": "4.37.2",
26
+ "use_cache": true,
27
+ "vocab_size": 32017
28
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.37.2"
6
+ }
model-00001-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44f30dc0a92bc6574428303e23a6c0964174ee94b1e701fa42f119eddf2110c
3
+ size 4807296496
model-00002-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f371c9797b49a1818be31f13189b21894be17abc77eb68a6c7dacb4f8e9704b2
3
+ size 4630578440
model-00003-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f5f1edd281d9775b494a113540cb48d6841569c03a96cb17e253e8a8d1f1593
3
+ size 4362142864
model-00004-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2132e1459c61cd88cd2b4c312e1cb875bf5243465b8a4efa6b9cc3b3bfc02cec
3
+ size 4966188864
model-00005-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb6e2477e9b0b7132ab5cd83a99a3704a27e23ca754ae0be5df32b6ddbfcf441
3
+ size 4362142864
model-00006-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:275616391af8a2683efbe3869bad28bb5a7e5c64b018f1f1914112d7769903a9
3
+ size 4362142864
model-00007-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d57593a90e8ab7b3773462e08a2d03a20a6368e8424738f61b2bdf4f64037753
3
+ size 4966188864
model-00008-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01c176dd13d24cce03d915ba907fdfe32af02054f7675e130610a4a50f057dc5
3
+ size 4362142880
model-00009-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28db210f73f2188bab3828c467e1ba8d141109443378c3a29d1ec140cee24d9d
3
+ size 4362142872
model-00010-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d12869ec39c315347caa7afbca5586788d4b95f32585925ba0be7a96adaf2bd
3
+ size 4966188880
model-00011-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1487a550365f076689e3659b67466dbc2b322b477957f37abc6b62b2486a42c7
3
+ size 4362142872
model-00012-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1804d2848dc8898194ef2d25056ddffc6a86bff2c210cbeb78ffc2b2128dcd78
3
+ size 4362142872
model-00013-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf7f8ac8e8a0a32ecff1124bf0513e3a3b4bfd680b4c7d5a5f27c75f6aedc267
3
+ size 4966188880
model-00014-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef8c4db30c35951ae16df352286cc47594d12b8cf0b4afc72989ac8bfaf2b50
3
+ size 4362142872
model-00015-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbf5c961404fd9b659d6fd7ed2c3fe31b745e1fb1c2dfd2627789fbaf7066271
3
+ size 4362142872
model-00016-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e1e018e77c90d7315f9ca5adc896d042c624d9d7cdd4545e77b119c960955a1
3
+ size 4966188880
model-00017-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66f17b39749a12195242e6fc76058c2ce681560c31d2b61cdf01d618440e60b8
3
+ size 4362142872
model-00018-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6e7727d00bd5306de377d8d697e119ea62c2a53770f6fb54baf791fcdd6457f
3
+ size 4362142872
model-00019-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f980f2724b5efef11aba2d3c2e21f376360e68a4f41c85a3a8f14c57b899a98
3
+ size 4966188880
model-00020-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6d28fe1b87f35581a393ed23a9a7960137c586363a43fe134a6f802f3e9919
3
+ size 4362142872
model-00021-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85371cddd82e6459d7b1cbba1237e0b414539dfe3522882179e5af0abd64ccd6
3
+ size 4362142872
model-00022-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:959127991902a94a91669e30363c90a67810a52e3142ce5f7a2f908964c73bf0
3
+ size 4966188880
model-00023-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:278ae88f1c61df761593d4a3cce286b8be4cce0e90a37e5ab3c78b016ac402a4
3
+ size 4362142872
model-00024-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc90c062ac66b626383f8eb13655054e6d8197771c7063cab579babd82a484c4
3
+ size 4362142872
model-00025-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b2235386f1e48e03ed8a8c5d920c04931419bd4b765a31a1fa05e002a03c556
3
+ size 4966188880
model-00026-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:569fb6ca087dc124de13c19d5f5027f4aacf1104e330ba9796307741b26925c3
3
+ size 4362142872
model-00027-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e50faf290f8fde5b4a4b04f78228894a4f59b91372c37160fe04d0d157b324f
3
+ size 4362142872
model-00028-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd5554cb2e1b2c20b57ef323d03f8503182973e5bf73687b3f6ed81f88b259e2
3
+ size 4966188880
model-00029-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a712f513bed6dddd8cde9b88485c5db25ef4ee35600867d851d92e76df86c0
3
+ size 4362142872
model-00030-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:166c4281d86ec9683fc339a01bf537d42ef12a7b186ac14a5e0f7de798f3fdde
3
+ size 4362142872
model-00031-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d36da9926dd8868f30b9584b870fa068c4a174d7809f77cc5809aae56896390a
3
+ size 4966188880
model-00032-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ed077b14fff9ecb57102bb6f7ea32b248b452670bf31456fde62a5886458ff
3
+ size 4362142872
model-00033-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01dcf19ef6fbb286fe2d868ef7b738c796982e7d3ba2163e71b26e8814a8a823
3
+ size 4362142872
model-00034-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1533a69d5910e3ec69df3349b8c3703703367af01fdff78b433be0df812f840
3
+ size 4966188880
model-00035-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae7bd608da1edf12dac3e684ad504632192543cd1f5b2b3a99c0fb291dbb241a
3
+ size 4362142872
model-00036-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37666359397e186f8905bdf4634ee01625b4f3e4a652b612441654164bba140d
3
+ size 4362142872
model-00037-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:308dc865f397c805a29813436bc87ab62182749640cba6b8f71deb5ab2ab91e7
3
+ size 4966188880
model-00038-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e82ecfee42184e7b57cd8a1d4e7ca676309e9d48c89aa15f2b809cc454f6972
3
+ size 4362142872
model-00039-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6281dede905574ce3856ad6b1d4d5d30cbd0fefe2ec4a09fb7e14f51c979a7b9
3
+ size 4362142872
model-00040-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11bc1ce583318a4cf9cf647386786f818ff6092fbeda1df269c11310f50917c4
3
+ size 4966188880
model-00041-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3c78e972b00a18357f9e5c3fddd0045bb1dff28120581a5c278d087c346499
3
+ size 4362142872
model-00042-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28e71dd95cf65563c3d0be1870cf8c7d61cfda48a8b82d878046c385b3983e96
3
+ size 4362142872
model-00043-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6e0acbfd05b56f2b2c2196f4189c86065ff759ef47e0484527ea1c660990b9e
3
+ size 4966188880
model-00044-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d3e45974ce0bc071c085268af0a2b9e00745b53f7b7cebaed7e09a10f095ac6
3
+ size 4362142872
model-00045-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18a3021cf61db1e8aa5910886a52b7faae9b2563511778369bda21f63412ceff
3
+ size 4362142872
model-00046-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eef6c91dc333e5afd238bd0cb6f1bf3b75c4daab1dd5d3a6febc03b51b0f653
3
+ size 4966188880
model-00047-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:098845e4ee41cc8deb0f3ece1770c4a18dd7296dfde2e8deef668eb72853ba8e
3
+ size 4362142872
model-00048-of-00106.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecafa9aa5a28f2b0f681c84025326c4ca6a11eb67a141fec86fc90665f843779
3
+ size 4362142872