Hoffman2 Happy Hours: Running interactive & batch jobs¶

Raffaella D'Auria, PhD¶

Today Learning Outcomes¶

  • the Hoffman2 Cluster: system overview recap
  • how to follow this presentation in a terminal or in a jupyter notebook
  • working interactively on the Hoffman2 Cluster
  • where to look for applications already available on Hoffman2
  • running non-interactive work-flows (batch jobs)

[image: H2Cluster.png]

The cluster at your fingertips¶

In [ ]:
# What type of compute nodes?

qhost -F arch | tail -n +4 | xargs -l2 | grep -v ^sge | awk '{print $12,$3}'  | awk -F = '{print $2}' | sort | uniq -c | awk 'BEGIN {print "CPU-type\t\t# nodes\t\t#cores/node\t# tot. cores"} {SUM_NODES +=$1; SUM_CORES +=$1*$3; {printf "%-16s %8d\t %8d\t\t %8d\n", $2,$1,$3,$1*$3}} END {print "TOTALS\t\t\t"SUM_NODES"\t\t-\t\t\t"SUM_CORES}'
In [ ]:
# Same breakdown, including memory per node:
qhost -F arch | tail -n +4 | xargs -l2 | grep -v ^sge | awk '{print $12,$3,$8}'  | awk -F = '{print $2}' | sort | uniq -c | awk 'BEGIN {print "CPU-type\t\t# nodes\t\t#cores/node\t# tot. cores\t\tmemory/core (GB)\ttot memory (GB)"} {SUM_NODES +=$1; SUM_CORES +=$1*$3; SUM_MEM +=$4; {printf "%-16s %8d\t %8d\t\t %8d\t\t %.3f\t\t\t %.3f\n", $2,$1,$3,$1*$3,$4/$3,$4}} END {print "TOTALS\t\t\t"SUM_NODES"\t\t-\t\t\t"SUM_CORES"\t\t -\t\t\t"SUM_MEM}'
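The pipelines above boil down to a count-and-summarize pattern: sort the per-node records, count duplicates with `uniq -c`, and format the result with `awk`. A minimal sketch of that pattern on mock `qhost`-like data (the CPU names and core counts below are invented for illustration):

```shell
# Count nodes per CPU type from mock "arch cores" records
# (the sample data is hypothetical, not real qhost output):
printf 'intel-gold-6240 36\nintel-E5-2670 16\nintel-gold-6240 36\n' \
  | sort | uniq -c \
  | awk '{printf "%-18s %d nodes, %d cores/node\n", $2, $1, $3}'
```

This prints one line per CPU type with its node count and cores per node; the real pipelines add header rows and running totals on top of the same idea.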

How to follow this presentation¶

In this presentation we assume that:

  • you already have an account on the Hoffman2 Cluster
  • on your local computer you have access to a terminal and an SSH client or you have installed a remote desktop to connect to the cluster

If you will be running this presentation as a jupyter notebook:

  • you should have python installed

NOTE:¶

  • commands that you can cut and paste into your terminal may be preceded by the $ character, which indicates the terminal prompt and should not be included

How to run this presentation on a terminal¶

If you use a terminal and SSH to connect to the Hoffman2 Cluster:

  1. open a terminal on your local computer and SSH into the Hoffman2 Cluster with the command (substitute joebruin w/ your Hoffman2 user name):

    ssh joebruin@hoffman2.idre.ucla.edu

  2. when applicable cut and paste the commands from the slides omitting the $ character which is included to indicate the unix (or terminal) prompt

A summary of the commands is also available as a text file in:

/u/project/systems/PUBLIC_SHARED/dauria/F2023-INTRO-TO-H2/running-jobs.txt

How to run this presentation from a remote desktop¶

If you use a remote desktop (NoMachine or X2Go) to connect to the Hoffman2 Cluster:

  1. start a new connection (or reconnect to an existing suspended connection)
  2. open a terminal on the remote desktop

How to run this presentation as a jupyter notebook:¶

This presentation is a jupyter notebook; if you so choose, you can run it by following these steps:

  1. open a terminal on your local computer
  2. download the python script h2jupynb with the command:

    $ curl -O https://raw.githubusercontent.com/rdauria/jupyter-notebook/main/h2jupynb

    or:

    $ wget https://raw.githubusercontent.com/rdauria/jupyter-notebook/main/h2jupynb

How to run this presentation as a jupyter notebook - cont'd:¶

  1. run the script; for example, if your Hoffman2 Cluster account is joebruin (substitute joebruin w/ your user name):

    $ python h2jupynb -u joebruin -t 2 -m 5

    or:

    $ python3 h2jupynb -u joebruin -t 2 -m 5

How to run this presentation as a jupyter notebook - cont'd II:¶

  1. when the jupyter notebook interface opens in your local browser, click on the New button and select Terminal
  2. when the terminal opens in your browser, issue the command (do not include the $ sign):

$ cp /u/project/systems/PUBLIC_SHARED/dauria/F2023-INTRO-TO-H2/H2HH-jobs.ipynb ./

  3. navigate back to the Jupyter Notebook homepage and search for and double click on:

    H2HH-jobs.ipynb

  4. this presentation should open as a notebook

On which resources will your job run?¶

https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#computational-resources-on-the-hoffman2-cluster

Highp vs shared vs campus resources:¶

  • highp refers to the use of group-owned compute nodes
    • users can run jobs for up to 14 days
    • only for users in groups that own resources
  • shared refers to the use of temporarily unused group-owned compute nodes
    • users can run jobs for up to 24 hours
    • only for users in groups that own resources
  • campus refers to compute nodes owned by OARC/IDRE and made available to the UCLA community
    • users can run jobs for up to 24 hours
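The run-time limits above determine where a job can go. A tiny sketch of that decision (the 24-hour and 14-day limits come from the list above; the variable name is arbitrary):

```shell
# Decide where a job can run from its requested runtime in hours
# (limits taken from the highp/shared/campus list above):
h_rt_hours=72
if [ "$h_rt_hours" -le 24 ]; then
  echo "fits on campus, shared, or highp resources"
else
  echo "longer than 24 hours: must request highp (group-owned) nodes"
fi
# → longer than 24 hours: must request highp (group-owned) nodes
```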

What computational resources do I have access to?¶

Open a terminal on the Hoffman2 Cluster and issue:

$ myresources

if the first line of your output contains:

User joebruin is in the following resource group(s): campus

you do NOT have access to group-owned compute nodes and can run only for up to 24 hours on nodes owned by OARC/IDRE

if the first line of your output contains:

User joebruin is in the following resource group(s): gobruins evebruin

you have access to the nodes purchased by the groups gobruins and evebruin; you can run for up to 24 hours on shared queues and for up to 14 days when requesting to run on owned resources (highp mode)
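If you want to use the group list in a script, you can strip everything up to the colon. A sketch on the sample line shown above (this parsing approach is just one possibility, not an official tool):

```shell
# Extract the resource groups from a (sample) myresources first line:
line='User joebruin is in the following resource group(s): campus'
groups=${line#*: }   # drop everything through ": "
if [ "$groups" = "campus" ]; then
  echo "campus-only access: jobs limited to 24 hours"
else
  echo "group-owned access via: $groups"
fi
# → campus-only access: jobs limited to 24 hours
```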

In [ ]:
# Do I have access to highp resources?
# if you are running this presentation as a jupyter notebook you can test your resources by running this cell:

myresources -u rdtest

Do I have access to highp resources?¶

To find out, paste into a terminal connected to the cluster the command (omitting the $ character indicative of the unix prompt):

$ myresources

what do you see?

Working interactively on the Hoffman2 Cluster¶

Any work that will use substantial computational resources should be run on compute nodes and not on the login nodes.

To get an interactive session on one core of a compute node, from a terminal issue the following command (omitting the $ character indicative of the unix prompt):

$ qrsh

What happens?

(To terminate your interactive session, after the prompt returns, type: Control + d or logout)

Working interactively on the Hoffman2 Cluster (Cont'd)¶

Customizing your interactive session. To request:

  • a specific runtime of, for example, 12 hours, use:

    $ qrsh -l h_rt=12:00:00

  • a specific amount of memory, for example 4GB, use:

    $ qrsh -l h_data=4G

  • an entire node in exclusive mode (i.e., all of its cores and memory):

    $ qrsh -l exclusive

  • a session on group-owned nodes (check first if you have access with the command myresources):

    $ qrsh -l highp

  • access to a GPU card:

    $ qrsh -l gpu,cuda=1

See also: https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#examples-of-how-to-request-resources

Working interactively on the Hoffman2 Cluster - multiple cores¶

Customizing your interactive session. To request multiple computing cores:

  • from the same node (server); for example, to request 8 cores:

    $ qrsh -pe shared 8

  • across multiple nodes (servers); for example, to request 42 cores:

    $ qrsh -pe dc* 42

See also: https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#requesting-multiple-cores

Working interactively on the Hoffman2 Cluster - Examples¶

Putting it all together, here are a few examples:

  • To request an interactive session for 1 hour with 4GB per core and 6 cores on the same node:

    $ qrsh -l h_rt=1:00:00,h_data=4G -pe shared 6

  • To request an interactive session for 2 hours with 3GB per core and 48 cores across multiple nodes:

    $ qrsh -l h_rt=2:00:00,h_data=3G -pe dc* 48
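Note that h_data is requested per core, so the total memory reserved by a multi-core session is h_data times the number of cores. A quick check of the arithmetic for the first example above:

```shell
# h_data is per core: the first example (6 cores, 4 GB each)
# reserves 6 x 4 = 24 GB in total:
cores=6; h_data_gb=4
echo "total memory requested: $((cores * h_data_gb)) GB"
# → total memory requested: 24 GB
```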

What GPU cards are available and how to request them¶

https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#gpu-access

GPU cards available to all Hoffman2 users:

GPU type     Compute capability   No. of CUDA cores   Global memory size
A100         8.0                  6912                80 GB
V100         7.0                  5120                32 GB
RTX2080Ti    7.5                  4352                11 GB
P4           6.1                  2560                8 GB

What GPU cards are available and how to request them (Cont'd)¶

https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#gpu-access

Scheduler options to request specific GPU cards:

GPU type     Scheduler options
A100         -l gpu,A100,cuda=1
V100         -l gpu,V100,cuda=1
RTX2080Ti    -l gpu,RTX2080Ti,cuda=1
P4           -l gpu,P4,cuda=1

E.g., to request a session on a specific GPU card, issue at the command prompt:

$ qrsh -l gpu,P4,cuda=1,h_rt=3:00:00

NOTE: GPU cards are a hot commodity and you may need to wait for a while!

How to check the status of GPU nodes¶

To see all the CUDA GPU nodes (you may not have access to all) and their running jobs, issue at the command line:

$ qhost -l cuda.0.name=* -q -j

In [ ]:
qhost -l cuda.0.name=* -q -j

What applications/software is already available on Hoffman2?¶

Refer to: https://www.hoffman2.idre.ucla.edu/Using-H2/Software/Software.html

[image: Screenshot 2023-07-26 at 9.34.40 AM.png]

Apps available via modules¶

To see what applications are available in the current hierarchy, at a terminal connected to Hoffman2 issue the command:

$ module av # press enter to scroll down; press q to exit the view

To look for a specific software, for example R, issue the command:

$ modules_lookup -m R

In [ ]:
## Most centrally installed apps are available via `modulefiles`
## (if you are running this presentation as a jupyter notebook execute this cell):

module av --no-pager
In [ ]:
## Most centrally installed apps are available via `modulefiles`; to look for a specific software use `modules_lookup`
## (if you are running this presentation as a jupyter notebook execute this cell):

modules_lookup
In [ ]:
## To look for a specific application, say, R
## (if you are running this presentation as a jupyter notebook execute this cell
## or paste the command in your terminal):

modules_lookup -m R
In [ ]:
## Check which R (if any) is currently available in your environment
## (if you are running this presentation as a jupyter notebook execute this cell
## or paste the command in your terminal):

which R
In [ ]:
## Load an application in your environment - continued:
## (if you are running this presentation as a jupyter notebook execute this cell
## or paste the commands in your terminal):
which R
module load gcc/10.2.0; module load R/4.3.0
which R

Submitting non interactive (batch) jobs¶

What is a batch job?¶

  • a workflow that can be executed following a recipe (without user intervention)

Why?¶

  • instead of waiting for your interactive session to start, batch jobs start whenever resources become available
  • you can be notified by email when the job starts, finishes, or errors out
  • your job does not depend on the persistence of your network connection
  • after submitting batch jobs you can close the connection to the cluster
  • you can submit many batch jobs and they will all execute as resources become available

How?¶

  • you will generally use a submission script (a job recipe) in conjunction with the command: qsub
  • a submission script sets the job environment and contains the sequence of commands needed to run the job
  • a submission script (may) contain instructions for the scheduler (requests for resources, etc.)
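The bullets above can be made concrete with a minimal submission-script sketch (modeled on common SGE scripts; the actual submit_job.sh used in the hands-on below may differ in its details):

```shell
#!/bin/bash
# Minimal SGE submission-script sketch: the #$ lines are comments to
# bash but are read by the scheduler as resource requests.
#$ -cwd                        # run the job from the submission directory
#$ -o joblog.$JOB_ID           # write scheduler output to joblog.<job id>
#$ -j y                        # merge stderr into stdout
#$ -l h_rt=1:00:00,h_data=2G   # request 1 hour of runtime and 2 GB per core
#$ -m bea                      # email when the job begins, ends, or aborts

# the sequence of commands that does the actual work:
echo "job running on $(hostname)"
```

Save it to a file (e.g. my_job.sh) and submit it with `qsub my_job.sh`.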

Hands-on submitting a job¶

In [ ]:
## Submitting non interactive (batch) jobs

# create a time-stamped directory, cd to it and copy in it the submission script: 
# /u/local/apps/submit_scripts/submit_job.sh 
timestamp=`date "+%F"` 
mkdir -p $HOME/H2HH_$timestamp; cd $HOME/H2HH_$timestamp; pwd
if [ ! -f "submit_job.sh" ]; then 
   cp /u/local/apps/submit_scripts/submit_job.sh ./submit_job.sh
else 
   echo "File: submit_job.sh already present"; 
fi 

# check that the submission script has been copied in the current directory:
ls -l submit_job.sh
In [ ]:
# now submit the job: 
qsub submit_job.sh 

# is my job running? 
myjobs 

# save the job ID number into the variable $JOB_ID for later use:
JOB_ID=`myjobs | grep submit_job | awk '{print $1}'`

# echo the JOB_ID:
echo "JOB_ID=$JOB_ID"
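The JOB_ID extraction above is just grep plus awk over the myjobs listing. Here is the same pattern on a mock one-line listing (the line format and values are invented for illustration):

```shell
# Grab the first field (the job ID) of the line naming our job
# (mock myjobs-style line; real output has more columns):
line='735108 0.50000 submit_job joebruin qw 11/22/2023'
JOB_ID=$(echo "$line" | grep submit_job | awk '{print $1}')
echo "JOB_ID=$JOB_ID"
# → JOB_ID=735108
```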

When will my job start?¶

Very many jobs are constantly running on the cluster... how many?

In [ ]:
#first four jobs queuing (status "p" pending):

qstat -s p | head -n 6
In [ ]:
# tot. no. of jobs currently pending

qstat -s p | grep qw | wc -l
In [ ]:
#Let's count the total number of compute cores requested using some handy command line expressions:

count=0; qstat -s p | grep qw | awk -v count=$count '{count=count+$8} END {print "Total no. of cores requested: "count}'
In [ ]:
#first four jobs running (status "r" running):

qstat -s r | head -n 6
In [ ]:
# tot. no. of jobs running

qstat -s r | grep " r " | wc -l
In [ ]:
#Let's count the total number of compute cores in use by running jobs using some handy command line expressions: 

count=0; qstat -s r | grep @ | awk -v count=$count '{count=count+$9} END {print "Total no. of cores in use: "count}'
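The core-counting cells above all use the same awk accumulation pattern: add a field to a running total on every line, then print it in the END block. On a mock two-job qstat snippet (sample values invented) it looks like:

```shell
# Sum a slot column across lines: awk accumulates into count and
# prints the total in the END block (field 6 holds the mock slot count):
printf '123 0.5 jobA user qw 8\n124 0.5 jobB user qw 4\n' \
  | awk '{count += $6} END {print "Total no. of cores requested: " count}'
# → Total no. of cores requested: 12
```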

Anatomy of a submission script¶

In [ ]:
# let's take a look at the submission script:

cat submit_job.sh
In [ ]:
# let's take a look at the joblog file: 

cat joblog.${JOB_ID}

Where to find sample submission scripts¶

Under: https://www.hoffman2.idre.ucla.edu/Using-H2/Software/Software.html

Look for a specific software and navigate to the Batch use tab:

[image: Screenshot 2023-07-26 at 9.49.19 AM.png]

  • Paste the script (use copy button) in a file on Hoffman2

[image: Screenshot 2023-07-26 at 9.53.32 AM.png]

  • use, for example, the nano editor:

    $ nano stata_submit.sh

  • paste the script into the editor, edit as needed, then save and exit (Control + x)

  • submit the job w/:

    $ qsub stata_submit.sh

In [ ]:
# or look in:

ls /u/local/apps/submit_scripts

Submitting R jobs the easy way¶

In [ ]:
# Submit R jobs with R_job_submitter.sh:  

# create temporary directory in your $SCRATCH and change directory to it:
if [ ! -d $SCRATCH/R_tests ]; then mkdir $SCRATCH/R_tests; fi; cd $SCRATCH/R_tests 

# copy the R file R-benchmark-25.R:
if [ ! -f R-benchmark-25.R ]; then cp /u/local/apps/submit_scripts/R/R-benchmark-25.R ./;fi 

# submit the R script R-benchmark-25.R to the queues using R_job_submitter.sh:
/u/local/apps/submit_scripts/R_job_submitter.sh -n R-benchmark-25.R  -m 1 -t 1 -s 4 -v 4.0.2 -nts 
JOB_ID2=`myjobs | grep R-benchmar | awk '{print $1}'`

# echo JOB_ID:
echo "JOB_ID=$JOB_ID2"
In [ ]:
# check the submission status of the job(s):

myjobs
In [ ]:
# check if output has been generated:

ls -ltr
In [31]:
# check the submission script generated by `/u/local/apps/submit_scripts/R_job_submitter.sh`:

cat R-benchmark-25.cmd
In [32]:
# let's check the joblog file (one of the last two files in the list above): 

cat R-benchmark-25.joblog.$JOB_ID2
 
Job R-benchmark-25, ID no. 735109 started on:   n1020
Job R-benchmark-25, ID no. 735109 started at:   Wed Nov 22 11:55:23 PST 2023
 
Loading R/4.0.2
  Loading requirement: intel/.2019.2 curl/8.4.0
Currently Loaded Modulefiles:
 1) intel/.2019.2 <aL>   2) curl/8.4.0 <aL>   3) R/4.0.2  

Key:
<module-tag>  <aL>=auto-loaded  

R CMD BATCH --no-save --no-restore  R-benchmark-25.R R-benchmark-25.out.735109
real 28.07
user 32.88
sys 2.31
 
Job R-benchmark-25, ID no. 735109 finished at:  Wed Nov 22 11:55:51 PST 2023
 
In [ ]:
# let's check the output file: 

cat  R-benchmark-25.out.$JOB_ID2

Alternatively get a sample submission script from the H2Docs¶

  • visit https://www.hoffman2.idre.ucla.edu/Using-H2/Software/Software.html#r
  • click on the tab "Batch use"
  • navigate to the R submission script
  • click on the "copy button" shown on the top right corner of the submission script
  • paste it in a new file