lucadiliello committed on
Commit
0e3cd21
1 Parent(s): ff546ce

added tp sharded ckpts

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/opt-30b",
3
+ "_remove_final_layer_norm": false,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "relu",
6
+ "architectures": [
7
+ "OPTForCausalLM"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "bos_token_id": 2,
11
+ "do_layer_norm_before": true,
12
+ "dropout": 0.1,
13
+ "enable_bias": true,
14
+ "eos_token_id": 2,
15
+ "ffn_dim": 28672,
16
+ "hidden_size": 7168,
17
+ "init_std": 0.02,
18
+ "layer_norm_elementwise_affine": true,
19
+ "layerdrop": 0.0,
20
+ "max_position_embeddings": 2048,
21
+ "model_type": "opt",
22
+ "num_attention_heads": 56,
23
+ "num_hidden_layers": 48,
24
+ "pad_token_id": 1,
25
+ "prefix": "</s>",
26
+ "torch_dtype": "float16",
27
+ "transformers_version": "4.27.1",
28
+ "use_cache": true,
29
+ "vocab_size": 50272,
30
+ "word_embed_proj_dim": 7168
31
+ }
ds_inference_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"type": "bloom", "base_dir": "/science/lucadiliello/models/facebook/sharded/opt-30b-deepspeed-inference-fp16-shard-8", "checkpoints": {"non_tp": ["non-tp.pt"], "tp": ["tp_00_00.pt", "tp_01_00.pt", "tp_02_00.pt", "tp_03_00.pt", "tp_04_00.pt", "tp_05_00.pt", "tp_06_00.pt", "tp_07_00.pt", "tp_00_01.pt", "tp_01_01.pt", "tp_02_01.pt", "tp_03_01.pt", "tp_04_01.pt", "tp_05_01.pt", "tp_06_01.pt", "tp_07_01.pt", "tp_00_02.pt", "tp_01_02.pt", "tp_02_02.pt", "tp_03_02.pt", "tp_04_02.pt", "tp_05_02.pt", "tp_06_02.pt", "tp_07_02.pt", "tp_00_03.pt", "tp_01_03.pt", "tp_02_03.pt", "tp_03_03.pt", "tp_04_03.pt", "tp_05_03.pt", "tp_06_03.pt", "tp_07_03.pt", "tp_00_04.pt", "tp_01_04.pt", "tp_02_04.pt", "tp_03_04.pt", "tp_04_04.pt", "tp_05_04.pt", "tp_06_04.pt", "tp_07_04.pt", "tp_00_05.pt", "tp_01_05.pt", "tp_02_05.pt", "tp_03_05.pt", "tp_04_05.pt", "tp_05_05.pt", "tp_06_05.pt", "tp_07_05.pt", "tp_00_06.pt", "tp_01_06.pt", "tp_02_06.pt", "tp_03_06.pt", "tp_04_06.pt", "tp_05_06.pt", "tp_06_06.pt", "tp_07_06.pt", "tp_00_07.pt", "tp_01_07.pt", "tp_02_07.pt", "tp_03_07.pt", "tp_04_07.pt", "tp_05_07.pt", "tp_06_07.pt", "tp_07_07.pt"]}, "version": 1.0, "parallelization": "tp", "tp_size": 8, "dtype": "float16"}
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
non-tp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd9d68f2514fff789d00648f4d0773c910b166f5d1e51c54920639b5841b4ad4
3
+ size 429
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "</s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "</s>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_prefix_space": false,
4
+ "bos_token": {
5
+ "__type": "AddedToken",
6
+ "content": "</s>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "eos_token": {
13
+ "__type": "AddedToken",
14
+ "content": "</s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ },
20
+ "errors": "replace",
21
+ "model_max_length": 1000000000000000019884624838656,
22
+ "pad_token": {
23
+ "__type": "AddedToken",
24
+ "content": "<pad>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "padding_side": "left",
31
+ "special_tokens_map_file": null,
32
+ "tokenizer_class": "GPT2Tokenizer",
33
+ "unk_token": {
34
+ "__type": "AddedToken",
35
+ "content": "</s>",
36
+ "lstrip": false,
37
+ "normalized": true,
38
+ "rstrip": false,
39
+ "single_word": false
40
+ }
41
+ }
tp_00_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c26882660c767ce5005a9efca8a48500d865483fed2356f724d965d5e5196e92
3
+ size 1572785581
tp_00_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3be077f72491fe26c80ffa205731ceea55270f02be68e0033d58be1fae14fb
3
+ size 925480293
tp_00_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0084afc36f70d046245d50557a90e02303e0cd5af231f31518d617c919546b11
3
+ size 976846563
tp_00_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf77684b8a9f0221ba9d6bed79cc89a7f3071f9074265b2b6b34bc3ccb424dd9
3
+ size 925473189
tp_00_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c4c55a14365b48dabec5d5f0b22b22193ae4b73e9f0e7ae634379398bdce15d
3
+ size 976846563
tp_00_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:524e4bc6e4761dfb4f647b2b0ebc3b28f6e3b2484c17f906b71815aa447d3b10
3
+ size 925480357
tp_00_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2383cbd093ad1261b11a2293a16fc944a3a7e9bfab399eb0e75719cf325bd9e6
3
+ size 925480357
tp_00_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bfc56ad0bdbd4d209fe9b12014f986cd86b9dad2b019b0d9649661d44fb2e54
3
+ size 1646150759
tp_01_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3d98973a4cb975d61dfc908e39f562c32e7782066b0b869bf646ab96329b76c
3
+ size 1572785581
tp_01_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5060ed14ce6de8d304d63aa0f299fc01bf5ef9d818891d00b204b46a2ac9a85
3
+ size 925480293
tp_01_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24e25c293c0182ba8051e3fb3f00ab593c72da4f0ef728a379c2991b5f12cf7f
3
+ size 976846563
tp_01_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eaf6de268fc1d33fed71c081d0b2eb16bc248d9e823f9815137769665b76ce7
3
+ size 925473189
tp_01_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08ecde010b332e442204c262cea165d48165b18ff317b12f806fea7ccaa0e88c
3
+ size 976846563
tp_01_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d85659026294ba1eabe8e7a47397d8c85400a7511e00a451ab45d2f285a8f2a3
3
+ size 925480357
tp_01_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:715aeb88d85af6db640da8a8f93e84f669097babb10b307975f1237a55b3eea6
3
+ size 925480357
tp_01_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a01e3e8db32940bca54c6b543399b8238b00da7999b3350c65f9d3bc7e26bc3f
3
+ size 1646150759
tp_02_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f42b6c83411e0325cc0015318bfce07acf32fe63e662ea2cf6c0e49a7b991cd
3
+ size 1572785581
tp_02_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e346a3277d08757cbdb0f3f7efa1bb59a39ff2f8ac94614a8c8b4eb2c69064e4
3
+ size 925480293
tp_02_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:921ebde7213ca3e6a2d4e663489ef31a9ccfcabda38bd36404a3ed5f48b8e2d4
3
+ size 976846563
tp_02_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:029c22b4ba9a7f5e6a330e1febf063a366fe225cef083e7fffdbebdb74058bdb
3
+ size 925473189
tp_02_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8fdf045edcffbab10635a841ef64e00bf2714b0c696a220e31a52039e3f9eab
3
+ size 976846563
tp_02_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7de448302ced47d238f3a149b5211a011f865ff6ea723cab075baadfde994ad2
3
+ size 925480357
tp_02_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90dcc2bf582eac1b6791bc6b9db5c65a73ad367e99574175995a99855817749e
3
+ size 925480357
tp_02_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:909298a42c2f209c0d662063bd09c0f7cae13393fce7d232b999aab4474a78df
3
+ size 1646150759
tp_03_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a412beab94560853c7b87daf3781dc9070f2ecf6c1b15c6de5827ba7c3eb3005
3
+ size 1572785581
tp_03_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b7dea26ad5e8c9c324de1f27a0debf28be1b946f66589ef9f7d55cfb730f250
3
+ size 925480293
tp_03_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b79e7e0e6a222156d90fa7a28e60553acb6e083d33bd43e2b6215db1cca3a8af
3
+ size 976846563
tp_03_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c473ffbea673587fa266e63316948c5583f10b1ae726336feccc172bedf372
3
+ size 925473189
tp_03_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ab80776c9a979def96cf88d2accd16d02b662f28f9dea9626a8076874431ad8
3
+ size 976846563
tp_03_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6634347816671154be5830bef65d1e1fbf89fd03ac37c68d3f83514d1458681
3
+ size 925480357
tp_03_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5915a72b60d40941968abe25200d6a07755bed7a0a14558b57127c9c2088c143
3
+ size 925480357
tp_03_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c283fc1ba18d196819d20047746f2c4b3d173f04118a5dc2ab64af7c2e1d37d9
3
+ size 1646150759
tp_04_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e715c684852c96286c7f4821ffb1c18f4a8acbef420e512ca2764083e496eb23
3
+ size 1572785581
tp_04_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d619f45e8f3336071bbb883b3154d1759940912de293954620d1065bf73dc7bb
3
+ size 925480293
tp_04_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fb47d4b2baf35488284d473ad857303c24709c011d5948b2fe3a4299f9caf9f
3
+ size 976846563
tp_04_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4718eda4837a011d91bd525d2bd13ab145c3dc8a7e8927fdd10847142263a62a
3
+ size 925473189
tp_04_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:895061f14ac398c71d1115a5f04b392eaf13af6bb8bf6870a56992ce75c63958
3
+ size 976846563
tp_04_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d640105011413893a3ede588de04432eff4f732909ec99d55d35dcef6fd00239
3
+ size 925480357
tp_04_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2749083ee0d21243d19dc2d7a97da6f9b9a7473852cc98be7c27647f54aaa08
3
+ size 925480357
tp_04_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c68cd3dd13da88aa9838ec52fe682147053fcd38a89650d861927e5317e354d
3
+ size 1646150759
tp_05_00.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5590117f6b4e397b0f5da60d2ee2a050dba7d1184c0c4ba0a5758c51bda32375
3
+ size 1572785581
tp_05_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79bfc9c4cc3fd61c842cdb90983a2826fe23f5b0812b5676f887cb556ac46bfc
3
+ size 925480293
tp_05_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31ca8c5769b23ffe945a60616c0e041a19565af4e0b39b11d3a858f14e1e1f7b
3
+ size 976846563
tp_05_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24246eb55689c1e5377c34d318d5daee1e3323bd72db7cae46e2e6f2b9429cfe
3
+ size 925473189