ibivibiv committed on
Commit
153d38e
1 Parent(s): c2ea6a9

Upload LlamaForCausalLM

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +29 -0
  2. generation_config.json +8 -0
  3. model-00001-of-00061.safetensors +3 -0
  4. model-00002-of-00061.safetensors +3 -0
  5. model-00003-of-00061.safetensors +3 -0
  6. model-00004-of-00061.safetensors +3 -0
  7. model-00005-of-00061.safetensors +3 -0
  8. model-00006-of-00061.safetensors +3 -0
  9. model-00007-of-00061.safetensors +3 -0
  10. model-00008-of-00061.safetensors +3 -0
  11. model-00009-of-00061.safetensors +3 -0
  12. model-00010-of-00061.safetensors +3 -0
  13. model-00011-of-00061.safetensors +3 -0
  14. model-00012-of-00061.safetensors +3 -0
  15. model-00013-of-00061.safetensors +3 -0
  16. model-00014-of-00061.safetensors +3 -0
  17. model-00015-of-00061.safetensors +3 -0
  18. model-00016-of-00061.safetensors +3 -0
  19. model-00017-of-00061.safetensors +3 -0
  20. model-00018-of-00061.safetensors +3 -0
  21. model-00019-of-00061.safetensors +3 -0
  22. model-00020-of-00061.safetensors +3 -0
  23. model-00021-of-00061.safetensors +3 -0
  24. model-00022-of-00061.safetensors +3 -0
  25. model-00023-of-00061.safetensors +3 -0
  26. model-00024-of-00061.safetensors +3 -0
  27. model-00025-of-00061.safetensors +3 -0
  28. model-00026-of-00061.safetensors +3 -0
  29. model-00027-of-00061.safetensors +3 -0
  30. model-00028-of-00061.safetensors +3 -0
  31. model-00029-of-00061.safetensors +3 -0
  32. model-00030-of-00061.safetensors +3 -0
  33. model-00031-of-00061.safetensors +3 -0
  34. model-00032-of-00061.safetensors +3 -0
  35. model-00033-of-00061.safetensors +3 -0
  36. model-00034-of-00061.safetensors +3 -0
  37. model-00035-of-00061.safetensors +3 -0
  38. model-00036-of-00061.safetensors +3 -0
  39. model-00037-of-00061.safetensors +3 -0
  40. model-00038-of-00061.safetensors +3 -0
  41. model-00039-of-00061.safetensors +3 -0
  42. model-00040-of-00061.safetensors +3 -0
  43. model-00041-of-00061.safetensors +3 -0
  44. model-00042-of-00061.safetensors +3 -0
  45. model-00043-of-00061.safetensors +3 -0
  46. model-00044-of-00061.safetensors +3 -0
  47. model-00045-of-00061.safetensors +3 -0
  48. model-00046-of-00061.safetensors +3 -0
  49. model-00047-of-00061.safetensors +3 -0
  50. model-00048-of-00061.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "merged_marcoroni70b",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 28672,
14
+ "max_position_embeddings": 4096,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 8,
19
+ "pad_token_id": 0,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_scaling": null,
23
+ "rope_theta": 10000.0,
24
+ "tie_word_embeddings": false,
25
+ "torch_dtype": "float32",
26
+ "transformers_version": "4.36.2",
27
+ "use_cache": false,
28
+ "vocab_size": 32000
29
+ }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.36.2",
7
+ "use_cache": false
8
+ }
model-00001-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c921454a21d2c14b80ee950a05f42ecc36f2b44a382dcaa58f627911d4cfc78
3
+ size 4806739440
model-00002-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc6a497911d6e54cf79fe48a19d88a1874e123e1382f8b0825f80f86d94bf67a
3
+ size 4630578440
model-00003-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bb7cdf4b22b39aea4aec8a4545d137b271ff58ed20f0e416cdf9f516b1f5638
3
+ size 4362142864
model-00004-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acaaeb105328a6cd1beb6dbbec05a8e206faaa507afa92186bf0dfe620dca9a
3
+ size 4966188864
model-00005-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3a07113797690bcd5b09ebd0e5091415734730e1073a519d0ad868cf32fb018
3
+ size 4362142864
model-00006-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f685a6bec89b561abeed2d2d50a048f6360e18d41da6096c76c921c01d0a7726
3
+ size 4362142864
model-00007-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7879bf679306240982de17b19d7d1b5c8a61f502a6755814cf838e2344f7076
3
+ size 4966188864
model-00008-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acc9d683a48d957473b7190e2fc19438cd42114e815afa74ff11d5761cc31a44
3
+ size 4362142880
model-00009-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e65c0be11c75254b5a72851119a5c378c6cbde9f775c6395b592fef1ec5b933
3
+ size 4362142872
model-00010-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:833b9629fd2797930dab0ea203cddbbb5fa1dc146e402fbaf53b4b342dd5b9c9
3
+ size 4966188880
model-00011-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec8d428c5af18e27350d237b9042370fdf2503ec7acc6494e3b44a7c14da622e
3
+ size 4362142872
model-00012-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2af8795d69ed71e1a06d2dbbfd5b48439a46141bb90b795553cc758a0c562ea4
3
+ size 4362142872
model-00013-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ee7401f22503919607e109185c270e34d2f3ca723eb09e263a0f9bd94e66c94
3
+ size 4966188880
model-00014-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8603add4dd9382107bb77c6bd04b365e32a3ce2a6ef154d0c7a06a8131fce16
3
+ size 4362142872
model-00015-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:007854ada89f3f97a2d7281c8903dbb471751391dfb0f99bc2f441609f0c8309
3
+ size 4362142872
model-00016-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5359e3fbe06ac2c5f4226367b9862bbe9ec52f023a2b3903abc47f7ebf94a6
3
+ size 4966188880
model-00017-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11c1ff4222fc0bfc7384d9d786402aeb78de40f4233691be91a702aadcb2d7d0
3
+ size 4362142872
model-00018-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c37be7fc13e5be411457381725b07effdff88ed3eb8cfa2ddfd73b24a818df57
3
+ size 4362142872
model-00019-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:699f5e55ab8af815a8077bdfcd799cbde6d32cd2a8eed998aae0dedf878b7e41
3
+ size 4966188880
model-00020-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bfed75586618d1423e0d85b030ef09758ecf68ce3d287c43324dc281e2977e5
3
+ size 4362142872
model-00021-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3dc977d1e3642cf1d09c9359a8c09333a3960ef6ef1c96b47086472ceedbde5
3
+ size 4362142872
model-00022-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a48af4b56cb5f36ae09912a4aea1999522b80faf83eaf987e4a96e1cac763e01
3
+ size 4966188880
model-00023-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84dd5e109fedaa08bd68da7ff92c3ae47a14f902c04d249a6ba79240bcab2374
3
+ size 4362142872
model-00024-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50a71a3b20c05490d0ebfa4705bba954162ddca20d61fbdb434ee8ed03effe47
3
+ size 4362142872
model-00025-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:150f593b91b8e37d3f1534dc7fa08929dec9296f50e949977dcda9f9e4ebe8e5
3
+ size 4966188880
model-00026-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2deffdd7aa5fd025f13634d2185c4831bb7a1d2eb895fd446604b1def0b08484
3
+ size 4362142872
model-00027-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ebb73f23107966e39d94d4ba043166d9e9e83320818b33d9f4ea0440eb72113
3
+ size 4362142872
model-00028-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3181d787fa6a9c47741d7c70375cfd4566ac5275deb85b80cc9680b2c6b4f54
3
+ size 4966188880
model-00029-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a30b9d4e0f70d6a7737d975dd6539dbdda47a270748c1c0b2cb843cf9fa98aba
3
+ size 4362142872
model-00030-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38b2d4a4ca167ef885d2e6347c018f45f0ab247ebf434a0f4c7590c683dba96c
3
+ size 4362142872
model-00031-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:634c36e9b3bf11f9a0705a2b218d769c5ecc457227aa0b1b69ec3ea9185e7721
3
+ size 4966188880
model-00032-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d730cb66474233b5da031179301133298e5e2e40ec1a8b5c6583187a0042932d
3
+ size 4362142872
model-00033-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fb9a14b0ad587092fa350b2e2ba70ab689030e5de5136f9435f195cc219f78d
3
+ size 4362142872
model-00034-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e99c2e241a386b946dfa9de6c2f2b80ec80f99733a586bda62b2d2ff83d0a977
3
+ size 4966188880
model-00035-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1487c296ecf3c1955d32c5b8d36c768830a14919958bd734f4f60993e787bfbe
3
+ size 4362142872
model-00036-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92b2d0eeb416f96052a7eb82a84065193d6b76b209a6b32767066c81da2fe08
3
+ size 4362142872
model-00037-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f6941e407b38a38999e9eb16b823760e75654704c3c9632cdb63954f91f6597
3
+ size 4966188880
model-00038-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ba77213ae35e9e785ac16d74ee8eb5cbdbef1b03ba8f7f2fb6a8711ff58df3e
3
+ size 4362142872
model-00039-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50bfdbcbcc0253f1d755599bbc777a1e90c1995924d776299bbcf6b9005f3f40
3
+ size 4362142872
model-00040-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7548698a52f67879ed7333e01296f59d0924756faf718e13f7cc6af0e35672d4
3
+ size 4966188880
model-00041-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c062571485cd736c62d949f2fabc4deecc80ed7192e3cd59b815331ea8ce13eb
3
+ size 4362142872
model-00042-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7e712a14133c9a2e1a7ed50edc4163712431df86d944a227b1acafde74da6cb
3
+ size 4362142872
model-00043-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6943e2137d3da0eed59ada7bf8dadac1c05016835d199d83ce6d3bac7ee6c3e2
3
+ size 4966188880
model-00044-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2207531330d874f2fd3f2d9971ef4f6847355ce5c655a5a5ea65b5df5dad8022
3
+ size 4362142872
model-00045-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7267b73fce2a4d4f63643c2ef281e91157aac7e4cde784eb875b431d8813ef9
3
+ size 4362142872
model-00046-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2bddfc5288852364407679c384bf7fcfc6a81638ccd03b0c1fc63367cae1a9d
3
+ size 4966188880
model-00047-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bf30fb3f82c73ac064c826e888cde87fb6c07722ba139fa07a570bf4a037a2e
3
+ size 4362142872
model-00048-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81da0ee7520aa5feec78297401a97a877a796c4a70c92e04b72c7cc5c7fbafe0
3
+ size 4362142872