opt-30b-deepspeed-inference-fp16-shard-8 / ds_inference_config.json
lucadiliello's picture
Update ds_inference_config.json
4fc9560
raw
history blame contribute delete
No virus
1.21 kB
{"type": "ds_model", "base_dir": "/science/lucadiliello/models/facebook/sharded/opt-30b-deepspeed-inference-fp16-shard-8", "checkpoints": {"non_tp": ["non-tp.pt"], "tp": ["tp_00_00.pt", "tp_01_00.pt", "tp_02_00.pt", "tp_03_00.pt", "tp_04_00.pt", "tp_05_00.pt", "tp_06_00.pt", "tp_07_00.pt", "tp_00_01.pt", "tp_01_01.pt", "tp_02_01.pt", "tp_03_01.pt", "tp_04_01.pt", "tp_05_01.pt", "tp_06_01.pt", "tp_07_01.pt", "tp_00_02.pt", "tp_01_02.pt", "tp_02_02.pt", "tp_03_02.pt", "tp_04_02.pt", "tp_05_02.pt", "tp_06_02.pt", "tp_07_02.pt", "tp_00_03.pt", "tp_01_03.pt", "tp_02_03.pt", "tp_03_03.pt", "tp_04_03.pt", "tp_05_03.pt", "tp_06_03.pt", "tp_07_03.pt", "tp_00_04.pt", "tp_01_04.pt", "tp_02_04.pt", "tp_03_04.pt", "tp_04_04.pt", "tp_05_04.pt", "tp_06_04.pt", "tp_07_04.pt", "tp_00_05.pt", "tp_01_05.pt", "tp_02_05.pt", "tp_03_05.pt", "tp_04_05.pt", "tp_05_05.pt", "tp_06_05.pt", "tp_07_05.pt", "tp_00_06.pt", "tp_01_06.pt", "tp_02_06.pt", "tp_03_06.pt", "tp_04_06.pt", "tp_05_06.pt", "tp_06_06.pt", "tp_07_06.pt", "tp_00_07.pt", "tp_01_07.pt", "tp_02_07.pt", "tp_03_07.pt", "tp_04_07.pt", "tp_05_07.pt", "tp_06_07.pt", "tp_07_07.pt"]}, "version": 1.0, "parallelization": "tp", "tp_size": 8, "dtype": "float16"}