bloom-deepspeed-inference-fp16 / ds_inference_config.json
jeffra's picture
mp-size -> tp-size
348b3ad
{
"type": "BLOOM",
"checkpoints": {
"non_tp": [
"non-tp.pt"
],
"tp": [
"tp_00_00.pt",
"tp_01_00.pt",
"tp_02_00.pt",
"tp_03_00.pt",
"tp_04_00.pt",
"tp_05_00.pt",
"tp_06_00.pt",
"tp_07_00.pt",
"tp_00_01.pt",
"tp_01_01.pt",
"tp_02_01.pt",
"tp_03_01.pt",
"tp_04_01.pt",
"tp_05_01.pt",
"tp_06_01.pt",
"tp_07_01.pt",
"tp_00_02.pt",
"tp_01_02.pt",
"tp_02_02.pt",
"tp_03_02.pt",
"tp_04_02.pt",
"tp_05_02.pt",
"tp_06_02.pt",
"tp_07_02.pt",
"tp_00_03.pt",
"tp_01_03.pt",
"tp_02_03.pt",
"tp_03_03.pt",
"tp_04_03.pt",
"tp_05_03.pt",
"tp_06_03.pt",
"tp_07_03.pt",
"tp_00_04.pt",
"tp_01_04.pt",
"tp_02_04.pt",
"tp_03_04.pt",
"tp_04_04.pt",
"tp_05_04.pt",
"tp_06_04.pt",
"tp_07_04.pt",
"tp_00_05.pt",
"tp_01_05.pt",
"tp_02_05.pt",
"tp_03_05.pt",
"tp_04_05.pt",
"tp_05_05.pt",
"tp_06_05.pt",
"tp_07_05.pt",
"tp_00_06.pt",
"tp_01_06.pt",
"tp_02_06.pt",
"tp_03_06.pt",
"tp_04_06.pt",
"tp_05_06.pt",
"tp_06_06.pt",
"tp_07_06.pt",
"tp_00_07.pt",
"tp_01_07.pt",
"tp_02_07.pt",
"tp_03_07.pt",
"tp_04_07.pt",
"tp_05_07.pt",
"tp_06_07.pt",
"tp_07_07.pt"
]
},
"version": 1,
"parallelization": "tp",
"tp_size": 8,
"dtype": "float16"
}