安装依赖
yum groupinstall 'Development Tools' -y
yum install hwloc hwloc-devel gtk2-devel gtk2 pam libevent-devel pam-devel numactl-devel readline-devel lua-devel hdf5-devel.x86_64 man2html freeipmi-devel openssl-devel rrdtool-devel mariadb-server mariadb mariadb-devel json-c json-c-devel -y
yum install munge munge-devel freeipmi freeipmi-devel pmix-devel readline-devel rrdtool rrdtool-devel json-c json-c-devel yaml-cpp-devel yaml-cpp -y
yum install perl python3 libcurl-devel libyaml-devel libjwt-devel lz4-devel libnuma-devel -y
#安装nvidia显卡支持库
./cuda_12.0.1_525.85.12_linux.run  # 必须安装 CUDA 才能支持 NVML
./NVIDIA-Linux-x86_64-525.105.17.run -no-x-check -no-nouveau-check -no-opengl-files -s  # 此方法无效
安装 PMIx(进程管理接口库,供 slurm 调度器使用)
安装 pmix 1.2.5(版本过旧,已弃用)
tar -xf pmix-1.2.5.tar.gz
cd pmix-1.2.5
./configure --prefix=/data/software/pmix/1.2.5
make && make install
安装pmix 2.2.5
tar -xf pmix-2.2.5.tar.bz2
cd pmix-2.2.5/
./configure --prefix=/data/software/pmix/2.2.5
make -j 4 && make install
安装 pmix 3.1.6
tar -xf pmix-3.1.6.tar.gz
cd pmix-3.1.6/
./configure --prefix=/data/software/pmix/3.1.6
make -j 4 && make install
安装 pmix 4.1.1(需先解压源码包,例如 tar -xf pmix-4.1.1.tar.bz2,以实际下载的文件名为准)
cd pmix-4.1.1/
./configure --prefix=/data/software/pmix/4.1.1
make -j 4 && make install
编译slurm
rpmbuild --define '_slurm_sysconfdir /etc/slurm/' --define '_defaultdocdir /etc/slurm/docs' --define '_with_pmix --with-pmix=/data/software/pmix/2.2.5/:/data/software/pmix/3.1.6/:/data/software/pmix/4.1.1/' --define '_with_nvml --with-nvml=/usr/local/cuda-12.0' -ta slurm-22.05.11.tar.bz2
安装slurm 调度系统
master
#配置nis
#配置munge
#配置数据库
mkdir -p /opt/src/slurm
cp /root/rpmbuild/RPMS/x86_64/*.rpm /opt/src/slurm/
yum localinstall /opt/src/slurm/*.rpm