#!/bin/bash
#
# SLURM batch script: launches a Python program through `srun` on one node
# with 4 tasks and 4 GPUs inside the `ddgan` conda environment.
#
# Usage:
#   sbatch <this-script> <python-script> [args...]
#
# Every argument given after the script name is forwarded unchanged to
# `python -u`.
#
# NOTE: the #SBATCH directives must stay ahead of the first executable
# command; sbatch stops reading directives once it meets one.
#SBATCH --account=laionize
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=4
#SBATCH --cpus-per-task=24
#SBATCH --time=06:00:00
#SBATCH --gres=gpu:4
#SBATCH --partition=booster

# Trace each command into the job log. Set here rather than in the shebang so
# tracing is also active when the file is run as `bash <script>`.
set -x

# Refuse to start without a program to run: a bare `python -u` on every task
# would only burn the allocation.
if (( $# == 0 )); then
  printf 'usage: sbatch <this-script> <python-script> [args...]\n' >&2
  exit 2
fi

# `ml` is presumably the Lmod shorthand for `module load` -- confirm on the
# target cluster.
ml CUDA

# Activate the project's miniconda install, then the `ddgan` environment.
source /p/project/laionize/miniconda/bin/activate
conda activate ddgan

# Expose four GPU indices, matching --gres=gpu:4 above.
export CUDA_VISIBLE_DEVICES=0,1,2,3
echo "Job id: $SLURM_JOB_ID"

# Presumably read by the Hugging Face tokenizers library -- confirm.
export TOKENIZERS_PARALLELISM=false

# Communication-layer (NCCL / UCX) timeout and retry tuning. The values are
# kept exactly as in the original; the reason for them is not recorded here.
#export NCCL_ASYNC_ERROR_HANDLING=1
export NCCL_IB_TIMEOUT=50
export UCX_RC_TIMEOUT=4s
export NCCL_IB_RETRY_CNT=10

# "$@" forwards each argument as its own word, so values containing spaces or
# glob characters reach Python intact (unquoted $* would re-split them).
srun python -u "$@"