Introduction to Linux
Why Linux?
Linux-based operating systems are the de facto standard for HPC systems.
Thus it is vital to have a solid understanding of how to work with Linux.
Linux Introductory Training
We offer an in-person course that combines a lecture and interactive exercises.
The course covers the following topics:
- Why Linux?
- Directory Structure
- The Terminal
- Navigating the Directory Structure
- Modifying the Directory Structure
- Handling Files
- Permission Denied
- Editing Files in the Terminal
- Workflow and Pipelines
- Automation and Scripting
- Environment Variables
- Monitoring System Resources
Registration
Dates for the courses are announced via the
tier3-hpc mailing list.
Registration for the next course can be done via
Moodle.
We expect everyone who registered for the course to participate in the next course.
If you change your mind about participating, please deregister from the course
to free up one of the limited spots for others.
Do I Need This Course?
If you are already proficient in the topics listed above, you may skip the course.
Attending the course is not a requirement for getting access to the cluster.
In the Moodle course we provide a quiz where you can check your proficiency with Linux.
Slides
Here you may download the slides for the course:
Introduction to Linux.
Introduction to HPC
Why HPC Training?
Using HPC resources differs significantly from working with a regular desktop computer.
Thus it is vital to have a solid understanding of how to work with HPC systems.
HPC Introductory Training
We offer an in-person course that combines a lecture and interactive exercises.
The course covers the following topics:
- What is High Performance Computing?
- HPC-Cluster Components
- How to Access a Cluster?
- SLURM - Requesting Resources
- SLURM - How Resources are Scheduled
- SLURM - Accounting and Sharing of Compute Time
- Environment Modules
- Parallelization Models
- Scaling of Parallel Applications
- Code of Conduct
Registration
Dates for the courses are announced via the
tier3-hpc mailing list.
Registration for the next course can be done via
Moodle.
We expect everyone who registered for the course to participate in the next course.
If you change your mind about participating, please deregister from the course
to free up one of the limited spots for others.
Do I Need This Course?
If you are already proficient in the topics listed above, you may skip the course.
Attending the course is not a requirement for getting access to the cluster.
In the Moodle course we provide a quiz where you can check your proficiency with HPC systems.
Slides
Here you may download the slides for the course:
Introduction to HPC.
Job Scripts
A SLURM job script usually consists of the following steps (a minimal skeleton combining them is sketched after the list):
- SLURM Header
- Create temporary folder on local disk
- Copy input data to temporary folder
- Load required modules
- Perform actual calculation
- Copy output file back to global file system
- Tidy up local storage
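The sections below explain each of these steps in detail. As a rough orientation, a minimal sketch of how the pieces fit together in one script could look as follows; the partition, account, module, and program names are placeholders and need to be adapted:

#!/bin/bash
#SBATCH --nodes=1
#SBATCH --partition=cpu               # placeholder partition
#SBATCH --time=00-01:00:00            # placeholder runtime
#SBATCH --account=your_project_0000   # placeholder account (check with rub-acclist)

# create a temporary working directory on the node-local disk
HDIR=$(pwd)
WDIR=/tmp/${SLURM_JOB_ID}
mkdir -p ${WDIR}
cd ${WDIR}

# copy the input data to the temporary folder
cp ${HDIR}/inputdata/* ${WDIR}

# load the required modules
module purge
module load the_modules_name_and_version

# perform the actual calculation (placeholder executable)
${HDIR}/my_program input > output

# copy the output back to the global file system and tidy up the local storage
cp output ${HDIR}/outputs/
rm -rf ${WDIR}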
The SLURM header is a section of the script directly after the shebang.
Every line in it begins with #SBATCH.
#SBATCH --nodes=1                # Request 1 node
#SBATCH --partition=gpu          # Run in the gpu partition
#SBATCH --job-name=minimal_gpu   # Name of the job in squeue
#SBATCH --gpus=1                 # Number of GPUs to reserve
#SBATCH --time=00:05:00          # Estimated runtime (dd-hh:mm:ss)
#SBATCH --account=lambem64_0000  # Project ID (check with rub-acclist)
This way the bash interpreter ignores these lines, but SLURM can pick them out and parse their contents.
Each line contains one of the sbatch flags.
On Elysium the flags --partition, --time, and --account are required.
For GPU jobs the --gpus flag must additionally be specified and set to at least 1.
Mandatory Flags
| Flag | Example | Note |
| --- | --- | --- |
| --partition=<partition> | --partition=cpu | list of partitions with sinfo |
| --time=<dd-hh:mm:ss> | --time=00-02:30:00 | maximum time the job will run |
| --account=<account> | --account=snublaew_0001 | project the used computing time shall be billed to; list of project accounts with rub-acclist |
| --gpus=<n> | --gpus=1 | number of GPUs; must be at least 1 for GPU partitions |
Optional Flags
| Flag | Example | Note |
| --- | --- | --- |
| --job-name=<name> | --job-name="mysim" | job name that is shown in squeue for the job |
| --exclusive | --exclusive | nodes are not shared with other jobs (default on cpu, fat_cpu, gpu) |
| --output=<filename> | --output=%x-%j.out | file name for stdout (%x = job name, %j = job ID) |
| --error=<filename> | --error=%x-%j.err | file name for stderr (%x = job name, %j = job ID) |
| --mail-type=<TYPE> | --mail-type=ALL | notify the user by email when certain event types occur; if specified, --mail-user must also be set |
| --mail-user=<rub-mail> | --mail-user=max.muster@rub.de | address to which job notifications of type --mail-type are sent |
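For illustration, a header that combines several of the optional flags from the table could look like this; the job name and mail address are placeholders:

#SBATCH --job-name=mysim
#SBATCH --output=%x-%j.out             # stdout goes to <job name>-<job id>.out
#SBATCH --error=%x-%j.err              # stderr goes to <job name>-<job id>.err
#SBATCH --mail-type=ALL
#SBATCH --mail-user=max.muster@rub.de

Once the header is complete, the finished script (here assumed to be saved as job.sh) is handed to the scheduler with sbatch, and squeue shows the state of your pending and running jobs:

# submit the job script
sbatch job.sh

# check the state of your own jobs
squeue -u ${USER}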
Temporary Folder
If your code reads input or writes output,
its performance can depend strongly on where the data is located.
If the data resides in your home directory or on the Lustre file system,
the read/write performance is limited by the bandwidth of the interconnect.
In addition, a parallel file system by design struggles with many small read/write operations;
its performance shines when reading/writing big chunks.
It is therefore advisable to create a folder on the local disks in the /tmp/ directory
and to perform all read/write operations in there.
At the beginning of the job any input data is copied there in one go,
and at the end all output data is copied from the /tmp/ directory to its final location in one go.
# obtain the current location
HDIR=$(pwd)

# create a temporary working directory on the node's local disk
WDIR=/tmp/${SLURM_JOB_ID}
mkdir -p ${WDIR}
cd ${WDIR}

# copy the set of input files to the working directory
cp ${HDIR}/inputdata/* ${WDIR}

...

# copy the set of output files back to the original folder
cp outputdata ${HDIR}/outputs/

# tidy up the local storage
rm -rf ${WDIR}
Loading Modules
If your program was built with certain versions of libraries,
it may be required to provide the same libraries at runtime.
Since everybody's needs regarding library versions differ,
Elysium utilizes environment modules to manage software versions.
# unload all previously loaded modules
module purge

# show all modules that are available
module avail

# load a specific module
module load the_modules_name_and_version

# list all loaded modules
module list
How to perform your calculation strongly depends on your specific software and inputs.
In general there are four typical ways to run HPC jobs.
Farming
Farming jobs are used if the program is not parallelized,
or scales in a way that allows it to utilize only a few CPU cores efficiently.
In that case multiple instances of the same program are started, each with a different input;
this works well as long as the instances have roughly the same runtime.
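The loop below assumes that a few shell variables have already been defined; hypothetical definitions, to be adapted to your program and the node in use, could look like this:

# hypothetical values for the farming loop below
myexe=./my_program            # serial executable (placeholder)
ncores=${SLURM_CPUS_ON_NODE}  # number of CPU cores available on the node
stride=1                      # start one instance per core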
for irun in $(seq 1 ${stride} ${ncores})
do
    # the core numbering starts at 0 and goes up to ncores-1
    taskset -c $(bc <<< "${irun}-1") ${myexe} inp.${irun} > out.${irun} &
done
wait
Shared Memory
Programs that incorporate thread spawning (usually via OpenMP) can
make use of multiple cores.
export OMP_NUM_THREADS=${SLURM_TASKS_PER_NODE}
${myexe} input
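Since the thread count above is taken from SLURM_TASKS_PER_NODE, the resource request in the header has to match it. One possibility, assuming a 48-core node as in the distributed-memory example below, is:

#SBATCH --nodes=1
#SBATCH --ntasks-per-node=48   # SLURM_TASKS_PER_NODE then evaluates to 48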
Distributed Memory
If programs require more resources than can be provided by one node
it is necessary to pass information between the processes running on different nodes.
This is usually done via MPI (the Message Passing Interface).
A program must be specifically written to utilize MPI.
ncorespernode=48
nnodes=${SLURM_JOB_NUM_NODES}
ncorestotal=$(bc <<< "${ncorespernode}*${nnodes}")
mpirun -np ${ncorestotal} -ppn ${ncorespernode} ${myexe} input
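The -np and -ppn flags above are specific to the mpirun launcher of some MPI implementations; other implementations use different flags. If the loaded MPI library was built with SLURM support, the processes can often be started with SLURM's own launcher instead. This is a sketch, not a statement about the MPI modules installed on Elysium:

# let SLURM start and place one MPI process per allocated task
srun ${myexe} input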
Hybrid Memory (Shared and Distributed Memory)
In programs that utilize distributed memory parallelization via MPI
it is possible to spawn threads within each process to make use of
shared memory parallelization.
nthreadsperproc=2
ncorespernode=$(bc <<< "48/${nthreadsperproc}")
nnodes=${SLURM_JOB_NUM_NODES}
ncorestotal=$(bc <<< "${ncorespernode}*${nnodes}")
export OMP_NUM_THREADS=${nthreadsperproc}
mpirun -np ${ncorestotal} -ppn ${ncorespernode} ${myexe} input
GPU
Support for offloading tasks to GPUs needs to be incorporated into the program.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
${myexe} input
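Whether the job actually has access to the GPUs can be checked from within the script, for example by printing the visible devices; the nvidia-smi call assumes NVIDIA GPUs:

# print which GPUs are visible to this job
echo "CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES}"
nvidia-smi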
Examples
The following example scripts are ready to use on the Elysium cluster.
The only change you need to make is to specify a valid account for the --account flag.
You can use the rub-acclist command to get a list of your available project accounts.
The executed programs do not produce any load and will finish in a few seconds.
The generated output shows where each process/thread ran and whether it had access to a GPU.
Minimal CPU Job Script Example
Farming Job Script Example
Shared Memory Job Script Example
Distributed Memory Job Script Example
Hybrid Memory Job Script Example
Minimal GPU Job Script Example
GPU Job Script Example
Distributed Memory with GPU Job Script Example