monai
medical
pathology_nuclick_annotation / configs /multi_gpu_evaluate.json
katielink's picture
fix the wrong GPU index issue of multi-node
5fbf6fb
{
  "device": "$torch.device('cuda:' + os.environ['LOCAL_RANK'])",
  "network": {
    "_target_": "torch.nn.parallel.DistributedDataParallel",
    "module": "$@network_def.to(@device)",
    "device_ids": ["@device"]
  },
  "validate#sampler": {
    "_target_": "DistributedSampler",
    "dataset": "@validate#dataset",
    "even_divisible": false,
    "shuffle": false
  },
  "validate#dataloader#sampler": "@validate#sampler",
  "validate#handlers#1#_disabled_": "$dist.get_rank() > 0",
  "initialize": [
    "$import sys",
    "$sys.path.append(@bundle_root)",
    "$import torch.distributed as dist",
    "$dist.is_initialized() or dist.init_process_group(backend='nccl')",
    "$torch.cuda.set_device(@device)",
    "$monai.utils.set_determinism(seed=123)",
    "$import logging",
    "$@validate#evaluator.logger.setLevel(logging.WARNING if dist.get_rank() > 0 else logging.INFO)"
  ],
  "run": [
    "$@validate#evaluator.run()"
  ],
  "finalize": [
    "$dist.is_initialized() and dist.destroy_process_group()"
  ]
}