You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: tutorials/scaling_up/scripts/hpc/leonardo/job.sbatch
+28-20Lines changed: 28 additions & 20 deletions
Original file line number
Diff line number
Diff line change
@@ -9,15 +9,6 @@
9
9
#SBATCH --gres=gpu:4
10
10
#SBATCH --exclusive
11
11
12
-
# Enable logging
13
-
set -x # Every command and its arguments are printed to stderr before being executed.
14
-
15
-
# Setup environment
16
-
module load cuda/12.3
17
-
module load gcc/12.2.0
18
-
module load binutils/2.42
19
-
source /leonardo_scratch/fast/EUHPC_D21_101/max_lue/python_envs/working/leonardo_modalities/bin/activate # TODO replace "working" with "stable" if needed
20
-
21
12
#### Environment variables
22
13
export CXX=g++
23
14
export CC=gcc
@@ -34,6 +25,14 @@ export GLOO_SOCKET_IFNAME=ib0
34
25
export CUDA_VISIBLE_DEVICES=0,1,2,3
35
26
export NCCL_ASYNC_ERROR_HANDLING=1
36
27
28
+
# Enable logging
29
+
set -x # Every command and its arguments are printed to stderr before being executed.
30
+
31
+
# Setup environment
32
+
module load cuda/12.3
33
+
source /leonardo_scratch/fast/EUHPC_D21_101/max_lue/python_envs/working/leonardo_modalities/bin/activate # TODO replace "working" with "stable" if needed
34
+
35
+
37
36
MASTER_ADDR=$(scontrol show hostnames "$SLURM_JOB_NODELIST"| head -n 1)
0 commit comments