swj0419 committed on
Commit
f4bb9f6
1 Parent(s): 597945d

Upload LlamaForCausalLM

Browse files
This view is limited to 50 files because it contains too many changes. See the raw diff.
Files changed (50) hide show
  1. config.json +27 -0
  2. generation_config.json +6 -0
  3. model-00001-of-00061.safetensors +3 -0
  4. model-00002-of-00061.safetensors +3 -0
  5. model-00003-of-00061.safetensors +3 -0
  6. model-00004-of-00061.safetensors +3 -0
  7. model-00005-of-00061.safetensors +3 -0
  8. model-00006-of-00061.safetensors +3 -0
  9. model-00007-of-00061.safetensors +3 -0
  10. model-00008-of-00061.safetensors +3 -0
  11. model-00009-of-00061.safetensors +3 -0
  12. model-00010-of-00061.safetensors +3 -0
  13. model-00011-of-00061.safetensors +3 -0
  14. model-00012-of-00061.safetensors +3 -0
  15. model-00013-of-00061.safetensors +3 -0
  16. model-00014-of-00061.safetensors +3 -0
  17. model-00015-of-00061.safetensors +3 -0
  18. model-00016-of-00061.safetensors +3 -0
  19. model-00017-of-00061.safetensors +3 -0
  20. model-00018-of-00061.safetensors +3 -0
  21. model-00019-of-00061.safetensors +3 -0
  22. model-00020-of-00061.safetensors +3 -0
  23. model-00021-of-00061.safetensors +3 -0
  24. model-00022-of-00061.safetensors +3 -0
  25. model-00023-of-00061.safetensors +3 -0
  26. model-00024-of-00061.safetensors +3 -0
  27. model-00025-of-00061.safetensors +3 -0
  28. model-00026-of-00061.safetensors +3 -0
  29. model-00027-of-00061.safetensors +3 -0
  30. model-00028-of-00061.safetensors +3 -0
  31. model-00029-of-00061.safetensors +3 -0
  32. model-00030-of-00061.safetensors +3 -0
  33. model-00031-of-00061.safetensors +3 -0
  34. model-00032-of-00061.safetensors +3 -0
  35. model-00033-of-00061.safetensors +3 -0
  36. model-00034-of-00061.safetensors +3 -0
  37. model-00035-of-00061.safetensors +3 -0
  38. model-00036-of-00061.safetensors +3 -0
  39. model-00037-of-00061.safetensors +3 -0
  40. model-00038-of-00061.safetensors +3 -0
  41. model-00039-of-00061.safetensors +3 -0
  42. model-00040-of-00061.safetensors +3 -0
  43. model-00041-of-00061.safetensors +3 -0
  44. model-00042-of-00061.safetensors +3 -0
  45. model-00043-of-00061.safetensors +3 -0
  46. model-00044-of-00061.safetensors +3 -0
  47. model-00045-of-00061.safetensors +3 -0
  48. model-00046-of-00061.safetensors +3 -0
  49. model-00047-of-00061.safetensors +3 -0
  50. model-00048-of-00061.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/fsx-onellm/swj0419/rlm_pretrain/xldumps/trevor/70b2/70b2_run000/checkpoints/checkpoint_0000090_consolidated/checkpoint_0000090_hf",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 8192,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 28672,
13
+ "max_position_embeddings": 2048,
14
+ "model_type": "llama",
15
+ "num_attention_heads": 64,
16
+ "num_hidden_layers": 80,
17
+ "num_key_value_heads": 8,
18
+ "pretraining_tp": 1,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_scaling": null,
21
+ "rope_theta": 10000.0,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.35.2",
25
+ "use_cache": true,
26
+ "vocab_size": 32000
27
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.35.2"
6
+ }
model-00001-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc6f3b504f2c2294f406f03f0bed7bd653104958d2f9019f3daa6d87e31af9cb
3
+ size 4806739440
model-00002-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beffb44f4f216dac9bc89de4b3b2b696606a4bf9e5ed69af7f94e7f53f70e259
3
+ size 4630578440
model-00003-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f7644adb60a8f3f03949ae5b353e4c766e0ae45dbb64913b95838e1e0d0d5b
3
+ size 4362142864
model-00004-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71a930fd44cf95c09829ccd4d2d32848f0115b33f9c1113456be8812016d961d
3
+ size 4966188864
model-00005-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:337565128e30d54402aa5cbc00ac6eaf8f079efab46ff4f241c6f3897ab0f66b
3
+ size 4362142864
model-00006-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:031dfc4f0c2843b6f532b4a98ecbbd47c38212c47115b18c035730d1660402cb
3
+ size 4362142864
model-00007-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda3b915490ec6957e4c58c1fe51e87f51d8c39ea8fdad87e90c100848186cb2
3
+ size 4966188864
model-00008-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9544dcc8f29d53ea6a13025fe5a393a9a7b29b948a0773f6e87c5f5911856046
3
+ size 4362142880
model-00009-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0563b3c6aead2de4ddd9e7ee796b84b922a92faee301cb98c8d98a99fb34b47b
3
+ size 4362142872
model-00010-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3388e56a0bce2d96d40dc12d5398d89e41f593f8163feb9ccad9a44d2c538df
3
+ size 4966188880
model-00011-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b0cd447111e6e10e96bf25224a5b3acbe945c3af2b7f2148f1799020a82a123
3
+ size 4362142872
model-00012-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2779b18cad31e88125a5ebab9a5bdea39d0b9bfd2cc53ab0971fdef750cd0c41
3
+ size 4362142872
model-00013-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ea1d321190aacd6ab718239a71b24d4d573353ee7c0957ae88b0c43ca8cec2
3
+ size 4966188880
model-00014-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62ab5185c71d640d3782751c8f5ec6f5a329b7f762a65003a9e861657d6c8323
3
+ size 4362142872
model-00015-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8462e741250fcfd0a6a39d0701b70c90c826551b4e8856aa8f2d07f36df1a3d0
3
+ size 4362142872
model-00016-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af2e83e3d303d9681a84464004f8668b94acd8e7319b5b7c1e48aed8c078c52
3
+ size 4966188880
model-00017-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3fc0db0f661847e89798d0d9429f364b8f83f2c370edae26ece515e28d725fd
3
+ size 4362142872
model-00018-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de8a7fb98808847952c214326f8b0aa26f5bab0d3d71c96ad6c2b26335b3e13d
3
+ size 4362142872
model-00019-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fa99e8b78ec58abef3caba55c58627a29f867ae835b7b821299799090d0abc2
3
+ size 4966188880
model-00020-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9983dcc7a6798054ba9bd34486e6cce1ac18b4041b51af70c2be149b95a05615
3
+ size 4362142872
model-00021-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:925de2e62ceda64268b4dd1bffbc37059bdd43573d2e45d1295fea5176708786
3
+ size 4362142872
model-00022-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02ffafe94363d6ec5d1411c8f05c90a31575587eb7cdc9f2ff55b5037def1ca
3
+ size 4966188880
model-00023-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:084305f3bec8d6e222fd8d5b6a149026b47cc36461b14d2e6c3c503e00046197
3
+ size 4362142872
model-00024-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ede76eafa28270b0eaf91daca4569556e8b7d1538764ede8bc9549b32e63a84c
3
+ size 4362142872
model-00025-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d44a37cbee3a70ba199765bfb0c726600b31c3a3ccc5b862c68729f4896b726
3
+ size 4966188880
model-00026-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eafb8c1cb3d9eccdb331a5e3b69aa566d2463eccb1dfe848294bcbbbeb2a639d
3
+ size 4362142872
model-00027-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46a4f31cdf54ff3454627630b7df1c9d750fe007229474bd0b024600032a776e
3
+ size 4362142872
model-00028-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0edef4ab30bd6fba0a0025d0a5af02f520580f189a918856eb97fa9f368baf2a
3
+ size 4966188880
model-00029-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35a2541a03b9ce39ce5180f91ca73273242d90e262e6961ba81beec1b7207efc
3
+ size 4362142872
model-00030-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4150db316fc7fc64c78548141ae1a89a08004281dde7abe030dc985c8f49e9d
3
+ size 4362142872
model-00031-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae074f9c6f2df9bfd7e473ed200bc48a2121c6375ba0bb6b93831567287eb5b
3
+ size 4966188880
model-00032-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dba918a8984849fbc93d62cbf05388e926dfa708c4379704f96abebba70c3cb
3
+ size 4362142872
model-00033-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25ead882ae570b605daa189509bec421f87bb29eb784ed4f2216319b8e11eea5
3
+ size 4362142872
model-00034-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de8a73288ccc567acd42a6a9e572b1053df24239d32c151677a35683dfa90887
3
+ size 4966188880
model-00035-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:218803783c017aeb4a45454148a2d2d0513c7b860b34fc3f152d691a0e1d0948
3
+ size 4362142872
model-00036-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8606fcb4ebc6be07aff84e397015568f2108b22cc630c9bdabb5d89cea57066
3
+ size 4362142872
model-00037-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1af81e9aa2b40b64d5bfe8891d48283ae561a267890be4794402373b9c73feb
3
+ size 4966188880
model-00038-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24305e97862adfd5631326dfbe033d00d38136621737d5251b428322399657aa
3
+ size 4362142872
model-00039-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a8d29d60f4dd58cd01983e134799f78ec641d2c4a05afa3f5591823d187cbd3
3
+ size 4362142872
model-00040-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00452029aa2dcaba23612946f4aac9d0684b4fc2d047e63a1e4573ca0d1962c4
3
+ size 4966188880
model-00041-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b86e4656ead2dfeddd4baae505616832191c83e1b100380854e989e06c9cbce
3
+ size 4362142872
model-00042-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4373db4ffebcc9720a21a194b70eb841c6b2eaedaddb52e1fef50d370b0412ae
3
+ size 4362142872
model-00043-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da51411a429b6985f20fb2251fb9b68fbabc545f347e5dc5a17d63e50dc62d95
3
+ size 4966188880
model-00044-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00af8b0b93b210c6c07f343e3b1599f63848f610c04129a195fc5ee4e3f157df
3
+ size 4362142872
model-00045-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c3efa23626f9705305a60fce6781b9761e1142d2087cad4469212454e46611
3
+ size 4362142872
model-00046-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20c9dc69bbb289bd09116f42886b4fe4e4fd72d538ad1b548aed929865e3281c
3
+ size 4966188880
model-00047-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ccd1d277d59dfa8e741c11b8b53c3f7865d23140bb8a463021955b0ac2b0851
3
+ size 4362142872
model-00048-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77acb9246d1ed70664874f177ff8dfa78f174e3ebd77f63399b798fcd8f7c1bf
3
+ size 4362142872