Spaces:
Runtime error
Runtime error
# Launch tools/train.py through Slurm's srun.
#
# Usage:
#   <this script> PARTITION JOB_NAME CONFIG WORK_DIR [PY_ARGS...]
#
# Positional arguments:
#   PARTITION   passed to `srun -p`
#   JOB_NAME    passed to `srun --job-name`
#   CONFIG      first argument handed to tools/train.py
#   WORK_DIR    handed to tools/train.py as --work-dir
#   PY_ARGS...  any further arguments, forwarded verbatim to tools/train.py
#
# Environment (all optional):
#   GPUS            value for --ntasks                              (default 8)
#   GPUS_PER_NODE   value for --gres=gpu: and --ntasks-per-node     (default 8)
#   CPUS_PER_TASK   value for --cpus-per-task                       (default 5)
#   SRUN_ARGS       extra srun options, split on whitespace         (default "")
#
# Exit status: 2 on a usage error, otherwise whatever srun returns.

if (( $# < 4 )); then
  printf 'Usage: %s PARTITION JOB_NAME CONFIG WORK_DIR [PY_ARGS...]\n' "${0##*/}" >&2
  exit 2
fi

# Random port in [12000, 31999], exported so child processes inherit it.
# NOTE(review): presumably consumed by the distributed launcher inside
# tools/train.py -- confirm against that script.
export MASTER_PORT=$((12000 + RANDOM % 20000))

# Trace every command from here on so the final srun invocation is logged.
set -x

PARTITION=$1
JOB_NAME=$2
CONFIG=$3
WORK_DIR=$4
GPUS=${GPUS:-8}
GPUS_PER_NODE=${GPUS_PER_NODE:-8}
CPUS_PER_TASK=${CPUS_PER_TASK:-5}
# Keep the extra arguments in an array so values containing spaces or glob
# characters reach tools/train.py as the caller wrote them.
PY_ARGS=("${@:5}")
SRUN_ARGS=${SRUN_ARGS:-""}

# The parent of this script's directory is prepended to PYTHONPATH for the
# srun command only.
# SRUN_ARGS is deliberately left unquoted: it is a whitespace-separated list of
# additional srun options supplied through the environment.
# shellcheck disable=SC2086
PYTHONPATH="$(dirname -- "$0")/..:${PYTHONPATH:-}" \
srun -p "${PARTITION}" \
  --job-name="${JOB_NAME}" \
  --gres=gpu:"${GPUS_PER_NODE}" \
  --ntasks="${GPUS}" \
  --ntasks-per-node="${GPUS_PER_NODE}" \
  --cpus-per-task="${CPUS_PER_TASK}" \
  --kill-on-bad-exit=1 \
  ${SRUN_ARGS} \
  python -u tools/train.py "${CONFIG}" --work-dir="${WORK_DIR}" --launcher="slurm" "${PY_ARGS[@]}"