Last active
November 15, 2019 16:30
-
-
Save williamFalcon/821517dd7a9fc8f366019b0295c9b992 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/bash -l
# SLURM SUBMIT SCRIPT
#
# Usage: sbatch <this_script> <conda_env_name>
#   $1 - name of the conda environment to activate before launching the job.
#
# Resource request (see the #SBATCH directives below):
#   --nodes=32            32 nodes
#   --gres=gpu:8          8 GPUs on each node
#   --ntasks-per-node=8   8 tasks on each node (presumably one per GPU)
#   --mem=0               no explicit per-node memory cap (SLURM treats 0 as
#                         "all memory on the node")
#   --time=0-02:00:00     wall-clock limit of 0 days, 2 hours
#
# NOTE: keep the #SBATCH lines free of trailing text; sbatch reads everything
# after the option as part of its value.
#SBATCH --nodes=32
#SBATCH --gres=gpu:8
#SBATCH --ntasks-per-node=8
#SBATCH --mem=0
#SBATCH --time=0-02:00:00

# activate conda env
# The argument is quoted so a name or path with spaces stays a single word.
# The ${1:+...} form passes no argument at all when $1 is unset or empty,
# instead of passing an empty string.
source activate ${1:+"$1"}

# -------------------------
# debugging flags (optional)
# NCCL_DEBUG=INFO asks NCCL for informational log output;
# PYTHONFAULTHANDLER=1 makes Python dump tracebacks on fatal signals.
export NCCL_DEBUG=INFO
export PYTHONFAULTHANDLER=1

# on your cluster you might need these:
# set the network interface
# export NCCL_SOCKET_IFNAME=^docker0,lo

# might need the latest cuda
# module load NCCL/2.4.7-1-cuda.10.0
# -------------------------

# run the training script
# srun starts the command once per allocated task. my_demo_file.py is resolved
# relative to the job's working directory.
# srun is the last command, so its exit status becomes the job's exit status.
srun python3 my_demo_file.py
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment