File size: 601 Bytes
ea847ad |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
#!/bin/bash -l
# SLURM SUBMIT SCRIPT
#SBATCH --partition=g40
#SBATCH --nodes=1
#SBATCH --gpus=8
#SBATCH --cpus-per-gpu=6
#SBATCH --job-name=realfake
#SBATCH --comment=laion
#SBATCH --signal=SIGUSR1@90
source "${HOME}/venv/bin/activate"
export NCCL_DEBUG=INFO
export PYTHONFAULTHANDLER=1
export PYTHONPATH="${HOME}/realfake"
echo "Working directory: `pwd`"
srun python3 realfake/train_cluster.py \
-jf "${HOME}/realfake/metadata/prepared.2000k.jsonl" \
-mn convnext_large -e 5 -bs 128 \
--acceleratorparams.devices=8 \
--acceleratorparams.strategy=ddp_find_unused_parameters_false
|