From 79d58f349110ed670c7c8e485c6a6107a6dd2c52 Mon Sep 17 00:00:00 2001 From: Joseph Viviano Date: Thu, 1 Aug 2024 23:25:42 -0400 Subject: [PATCH] some notes --- tutorials/examples/multinode/ddp_gfn.small.4.slurm | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/tutorials/examples/multinode/ddp_gfn.small.4.slurm b/tutorials/examples/multinode/ddp_gfn.small.4.slurm index 5940378..893084b 100644 --- a/tutorials/examples/multinode/ddp_gfn.small.4.slurm +++ b/tutorials/examples/multinode/ddp_gfn.small.4.slurm @@ -4,10 +4,13 @@ #SBATCH -J ddp #SBATCH --get-user-env #SBATCH --partition=spr -#SBATCH --ntasks=2 -#SBATCH --cpus-per-task=112 +#SBATCH --ntasks=2 # One task per socket, because each task uses all threads of its socket. +#SBATCH --cpus-per-task=112 # Number of hardware threads available per socket. #SBATCH --time=00:60:00 +# In my case (4 NUMA nodes), I would set ntasks=4 and cpus-per-task=8, because my CPU has +# 32 cores and I want to divide them evenly across the 4 NUMA nodes (32 / 4 = 8). + source /swtools/intel/2024.0/oneapi-vars.sh export I_MPI_HYDRA_BOOTSTRAP=slurm