How do I?

only

ssh user@linux.cs.uchicago.edu
ssh user@fe.ai.cs.uchicago.edu
man sbatch
amcguire@fe01:~$ cat mpi-hello.c 
#include <mpi.h>
#include <unistd.h>
#include <stdio.h>

/*
 * MPI "hello world": every process prints its rank, the total number of
 * processes in MPI_COMM_WORLD, and the name of the host it is running on.
 *
 * argc/argv are handed to MPI_Init unchanged. Returns 0 on completion.
 */
int main(int argc, char **argv) {
    // Initialize MPI
    MPI_Init(&argc, &argv);

    // Get the number of processes in the global communicator
    int count;
    MPI_Comm_size(MPI_COMM_WORLD, &count);

    // Get the rank of the current process
    int rank;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);

    // Get the current hostname; fall back to a placeholder if the lookup
    // fails so the printf below never reads an uninitialized buffer.
    char hostname[1024];
    if (gethostname(hostname, sizeof(hostname)) != 0) {
        snprintf(hostname, sizeof(hostname), "unknown");
    }
    // POSIX leaves it unspecified whether a truncated name is
    // NUL-terminated, so terminate the buffer explicitly.
    hostname[sizeof(hostname) - 1] = '\0';

    // Print a hello world message for this rank
    printf("Hello from process %d of %d on host %s\n", rank, count, hostname);

    // Finalize the MPI environment before exiting
    MPI_Finalize();
    return 0;
}
amcguire@fe01:~$ cat hello-job.sh
#!/bin/bash
# Slurm batch script that launches the mpi-hello binary on two MPI processes.
#SBATCH --job-name=mpi-hello    # Job name
#SBATCH --ntasks=2              # Number of processes
#SBATCH --time=0:10:00          # Max wall time
#SBATCH --output=hello-job.out  # Output file name

# Uncomment to disable the Infiniband transport for OpenMPI
# (Infiniband is not present on all clusters).
#export OMPI_MCA_btl="^openib"

# Start the program; the relative path assumes the batch script was
# submitted from the directory that contains the mpi-hello binary.
mpirun -np 2 ./mpi-hello

amcguire@fe01:~$ mpicc -o mpi-hello mpi-hello.c
amcguire@fe01:~$ ls -l mpi-hello
-rwxrwx--- 1 amcguire amcguire 16992 Jun 30 10:49 mpi-hello
amcguire@fe01:~$ sbatch -w p001,p002 -p peanut-cpu hello-job.sh
Submitted batch job 1196702
amcguire@fe01:~$ cat hello-job.out 
Hello from process 0 of 2 on host p001
Hello from process 1 of 2 on host p002
 mkdir -p $HOME/slurm/out
#!/bin/bash
#
# Minimal Slurm batch job: runs `hostname` as a single task on one node in
# the debug partition, so the output shows which node executed the job.
# Replace "cnetid" throughout with your own user name.
#
# Where and when to send e-mail notifications about this job.
#SBATCH --mail-user=cnetid@cs.uchicago.edu
#SBATCH --mail-type=ALL
# Separate files for stdout and stderr. %j and %N are filename patterns
# filled in by Slurm (job id and node name; see `man sbatch`). Create the
# target directory before submitting, e.g. mkdir -p $HOME/slurm/out.
#SBATCH --output=/home/cnetid/slurm/out/%j.%N.stdout
#SBATCH --error=/home/cnetid/slurm/out/%j.%N.stderr
# Directory the job is started from.
#SBATCH --chdir=/home/cnetid/slurm
#SBATCH --partition=debug
#SBATCH --job-name=check_hostname_of_node
# Resource request: one node, one task.
#SBATCH --nodes=1
#SBATCH --ntasks=1
# Memory per allocated CPU (presumably megabytes; confirm the default unit
# in `man sbatch`).
#SBATCH --mem-per-cpu=500
# Run-time limit for the job (see `man sbatch` for accepted time formats).
#SBATCH --time=15:00

# The actual work of the job: print the name of the node it landed on.
hostname
man sbatch
sbatch hostname.job
user@host:~$ srun -n2 hostname
slurm2
slurm2
user@host:~$ srun -n1 sleep 400
user@host:~$ squeue
JOBID PARTITION     NAME     USER ST       TIME  NODES NODELIST(REASON)
   29     debug    sleep     user  R       0:11      1 research2
scancel 29
user@host:~$ sinfo
PARTITION AVAIL  TIMELIMIT  NODES  STATE NODELIST
debug*       up 1-00:00:00      1    mix slurm1
fast         up 1-00:00:00      6   idle slurm[9-14]
general      up 21-00:00:0      6   idle slurm[2-6,8]
pascal       up 3-00:00:00      1   idle gpu2
quadro       up 3-00:00:00      1   idle gpu1
titan        up 3-00:00:00      1    mix gpu3
squeue -u cnetid
squeue -j 7894
 srun -p general --pty --cpus-per-task 1 --mem 500 -t 0-06:00 /bin/bash
#SBATCH --array start-finish[:step][%maximum concurrent]
#SBATCH --array 0-15         0, 1, ..., 15
#SBATCH --array 1-3          1, 2, 3
#SBATCH --array 1,3,4,6      1, 3, 4, 6
#SBATCH --array 1-8:2        1, 3, 5, 7
#SBATCH --array 1-10:3%2     1, 4, 7, 10, but only two of these will ever run concurrently.
#!/bin/bash
#
# Slurm array job: the same script is started once per array task, and each
# task processes the dataset selected by its SLURM_ARRAY_TASK_ID.
# Replace "cnetid" throughout with your own user name.
#
#SBATCH --mail-user=cnetid@cs.uchicago.edu
#SBATCH --mail-type=ALL
#SBATCH --output=/home/cnetid/slurm/out/%j.%N.stdout
#SBATCH --error=/home/cnetid/slurm/out/%j.%N.stderr
#SBATCH --chdir=/home/cnetid/slurm
#SBATCH --partition=debug
#SBATCH --job-name=check_hostname_of_node
#SBATCH --nodes=1
#SBATCH --ntasks=1
#SBATCH --mem-per-cpu=500
#SBATCH --time=15:00
# Task ids 0-3 match the zero-based indices of the four-element `input`
# array below; with 1-4 the first dataset would be skipped and task 4 would
# have no dataset at all.
#SBATCH --array 0-3

input=("small_dataset" "medium_dataset" "large_dataset" "huge_dataset")

# Bash only indexes an array inside ${...}; a bare $input[$i] expands to the
# first element followed by a literal "[i]". Quote the result so the dataset
# name is always passed as a single argument.
dataset="${input[$SLURM_ARRAY_TASK_ID]}"
./process "$dataset"
sbatch --gres=gpu:titan:2 ....
  --gres=gpu:N   # where 'N' is the number of GPUs requested.
                 # Please try to limit yourself to one GPU per person.
#!/usr/bin/env python3
# Print the list of local devices reported by TensorFlow. Handy for checking
# which GPUs (if any) are visible from inside the current Slurm allocation.
from tensorflow.python.client import device_lib
print(device_lib.list_local_devices())
user@bulldozer:~$ srun -p titan --pty /bin/bash
user@gpu3:~$ ./f 2>&1 | grep physical_device_desc
user@gpu3:~$
user@bulldozer:~$ srun -p titan --pty --gres=gpu:1 /bin/bash
user@gpu3:~$ ./f 2>&1 | grep physical_device_desc
physical_device_desc: "device: 0, name: GeForce GTX 1080 Ti, pci bus id: 0000:19:00.0, compute capability: 6.1"
user@bulldozer:~$ srun -p titan --pty --gres=gpu:2 /bin/bash
user@gpu3:~$ ./f 2>&1 | grep physical_device_desc
physical_device_desc: "device: 0, name: GeForce GTX 1080 Ti, pci bus id: 0000:19:00.0, compute capability: 6.1"
physical_device_desc: "device: 1, name: GeForce GTX 1080 Ti, pci bus id: 0000:1a:00.0, compute capability: 6.1"
kauffman3@bulldozer:~$ srun -p titan --pty --gres=gpu:5 /bin/bash
srun: error: Unable to allocate resources: Requested node configuration is not available
$ sinfo -O partition,nodelist,gres,features,available
PARTITION           NODELIST            GRES                FEATURES            AVAIL
debug*              slurm1              (null)              (null)              up
fast                slurm[9-14]         (null)              (null)              up
general             slurm[2-6,8]        (null)              (null)              up
pascal              gpu2                gpu:gtx1080:1       'pascal,gtx1080'    up
quadro              gpu1                gpu:p4000:2         'quadro,p4000'      up
titan               gpu3                gpu:gtx1080ti:4     'pascal,gtx1080ti'  up
$ squeue -O username,nodelist,gres
USER                NODELIST            GRES                
someusername        gpu3                gpu:1               
otherusername       gpu3                gpu:3               
...
# Select a CUDA toolkit release and expose it to programs started from this
# shell.
cuda_version="11.1"

# Root of the versioned toolkit install, e.g. /usr/local/cuda-11.1.
CUDA_HOME="/usr/local/cuda-${cuda_version}"

# Append the toolkit's libraries to the runtime linker search path.
LD_LIBRARY_PATH="${LD_LIBRARY_PATH}:${CUDA_HOME}/lib64"

# Append the CUDA tools directory (the unversioned /usr/local/cuda path) to
# the command search path.
PATH="${PATH}:/usr/local/cuda/bin"

export CUDA_HOME LD_LIBRARY_PATH PATH
#!/bin/bash
#
# Slurm batch job: writes a small CUDA program, compiles it with nvcc on the
# compute node, and runs it to print the name, memory clock, memory bus width
# and peak memory bandwidth of every CUDA device it can see.
# Replace "cnetid" throughout with your own user name.
#
#SBATCH --mail-user=cnetid@cs.uchicago.edu
#SBATCH --mail-type=ALL
#SBATCH --output=/home/cnetid/slurm/slurm_out/%j.%N.stdout
#SBATCH --error=/home/cnetid/slurm/slurm_out/%j.%N.stderr
#SBATCH --chdir=/home/cnetid/slurm
#SBATCH --partition=gpu
#SBATCH --job-name=get_tesla_info

# Make the CUDA tools and runtime libraries visible. The ${VAR:+...} form
# adds the ':' separator only when LD_LIBRARY_PATH already has a value, so an
# empty variable does not end up with a leading ':' (which the dynamic linker
# treats as "current directory").
export PATH="$PATH:/usr/local/cuda/bin"
export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/usr/local/cuda/lib64"

# Build in a private scratch directory: fixed names such as /tmp/a.out can
# collide with (or be replaced by) other jobs sharing the same node.
workdir=$(mktemp -d) || exit 1

# The delimiter is quoted so the C source is written out literally, with no
# shell expansion applied to it.
cat << 'EOF' > "$workdir/getinfo.cu"
#include <stdio.h>

int main() {
  int nDevices;

  cudaGetDeviceCount(&nDevices);
  for (int i = 0; i < nDevices; i++) {
    cudaDeviceProp prop;
    cudaGetDeviceProperties(&prop, i);
    printf("Device Number: %d\n", i);
    printf("  Device name: %s\n", prop.name);
    printf("  Memory Clock Rate (KHz): %d\n",
           prop.memoryClockRate);
    printf("  Memory Bus Width (bits): %d\n",
           prop.memoryBusWidth);
    printf("  Peak Memory Bandwidth (GB/s): %f\n\n",
           2.0*prop.memoryClockRate*(prop.memoryBusWidth/8)/1.0e6);
  }
}
EOF

# Only run the binary if compilation succeeded; otherwise there is nothing
# (or something stale) to execute.
if /usr/local/cuda/bin/nvcc "$workdir/getinfo.cu" -o "$workdir/getinfo"; then
  "$workdir/getinfo"
fi

# Remove the scratch directory together with the source and the binary.
rm -rf -- "$workdir"
cnetid@focal0:~$ cat $HOME/slurm/slurm_out/12567.gpu1.stdout 
Device Number: 0
  Device name: Tesla M2090
  Memory Clock Rate (KHz): 1848000
  Memory Bus Width (bits): 384
  Peak Memory Bandwidth (GB/s): 177.408000

	Slurm	Example
Submit a batch serial job	sbatch	sbatch runscript.sh
Run a script interactively	srun	srun --pty -p interact -t 10 --mem 1000 /bin/bash /bin/hostname
Kill a job	scancel	scancel 4585
View status of queues	squeue	squeue -u cnetid
Check current job by id	sacct	sacct -j 999999

Error	What does it mean?
JOB <jobid> CANCELLED AT <time> DUE TO TIME LIMIT	You did not specify enough time for your job to run. The `-t` flag will allow you to set the time limit.
Job <jobid> exceeded <mem> memory limit, being killed	Your job is attempting to use more memory than you have requested for it. Either increase the amount of memory you have requested or reduce the amount of memory your application uses.
JOB <jobid> CANCELLED AT <time> DUE TO NODE FAILURE	There can be many reasons for this message, but most often it means that the node your job was set to run on can no longer be contacted by the Slurm controller.
error: Unable to allocate resources: More processors requested than permitted	It usually has nothing to do with privileges you may or may not have. Rather, it usually means that you have allocated more processors than one compute node actually has.

Table of Contents

Slurm

Communication

Mailing List

Discord

Clusters

Peanut Cluster

AI Cluster

Where to begin

Documentation

Resources

Job Submission

Command Summary

Usage

Default Quotas

MPI Usage

Exclusive access to a node

sbatch

Sample script

Submitting job script

srun

squeue

scancel

sinfo

Monitoring Jobs

Interactive Jobs

Job Scheduling

Array Jobs

Common Issues

Using the GPU

GRES Multiple GPU's on one system

Ok, but I don't want to read the wall of text above

Cool, but how do I know where and what resources are available

Checking how many Generic RESources are being consumed

Environment Variables

CUDA_HOME, LD_LIBRARY_PATH

PATH

CUDA_VISIBLE_DEVICES

Example

Output

Feedback

More