This shows you the differences between two versions of the page.
Both sides previous revision Previous revision Next revision | Previous revision | ||
cluster:224 [2023/10/13 13:57] hmeij07 |
cluster:224 [2024/01/12 14:36] (current) hmeij07 |
||
---|---|---|---|
Line 7: | Line 7: | ||
< | < | ||
+ | |||
+ | # first step | ||
+ | yum update -y # get to the latest | ||
+ | reboot | ||
# IP ranges | # IP ranges | ||
Line 12: | Line 16: | ||
10.10.102.48 n38-eth1 | 10.10.102.48 n38-eth1 | ||
10.11.103.48 n38-ib0 | 10.11.103.48 n38-ib0 | ||
+ | DEVROUTE=yes # others no | ||
+ | GATEWAY=192, | ||
cd / | cd / | ||
vi ifcfg-eth0 # 192.168.102.x | vi ifcfg-eth0 # 192.168.102.x | ||
vi ifcfg-eth1 # 10.10.102.x | vi ifcfg-eth1 # 10.10.102.x | ||
+ | |||
+ | # or via rc.local? see n102 | ||
+ | vi ifcfg-ib0 | ||
+ | DEVICE=ib0 | ||
+ | ONBOOT=yes | ||
+ | MTU=65520 | ||
+ | CONNECTED_MODE=yes | ||
+ | BOOTPROTO=none | ||
+ | IPADDR=10.11.103.48 | ||
+ | PREFIX=16 | ||
+ | # check with ibstat | ||
+ | Port 1: | ||
+ | State: Active | ||
+ | Physical state: LinkUp | ||
+ | # check with ethtool ib0 | ||
+ | Speed: 40000Mb/s | ||
# root: sync cottontail' | # root: sync cottontail' | ||
ssh-keygen -t rsa | ssh-keygen -t rsa | ||
- | scp 10.10.102.253:/ | + | scp 10.10.102.250:/ |
/ | / | ||
vi / | vi / | ||
Line 71: | Line 93: | ||
yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | ||
- | #easybuild | + | # check first |
- | yum install | + | systemctl status rdma # loaded/ |
+ | rpm -qa | egrep " | ||
+ | # no # yum groupinstall " | ||
+ | yum install libibverbs-devel | ||
# amber20 cmake readline error fix needs | # amber20 cmake readline error fix needs | ||
- | yum install | + | yum install ncurses-devel readline-devel -y |
- | | + | |
- | | + | |
# amber20 | # amber20 | ||
Line 89: | Line 112: | ||
# FINISH native vanilla installs | # FINISH native vanilla installs | ||
# R version 4.1.2 (2021-11-01) -- "Bird Hippie" | # R version 4.1.2 (2021-11-01) -- "Bird Hippie" | ||
- | yum install R R-devel | + | yum install R R-devel |
# openjdk version " | # openjdk version " | ||
- | rpm -qa | grep ^java # check | + | rpm -qa | grep ^java # check, else |
yum install java-1.8.0-openjdk java-1.8.0-openjdk-devel \ | yum install java-1.8.0-openjdk java-1.8.0-openjdk-devel \ | ||
- | java-1.8.0-openjdk-headless | + | java-1.8.0-openjdk-headless |
- | # python v 3.9 | + | # python v 2.7.5 |
- | yum install python39 python39-devel | + | |
- | ln -s / | + | |
# fftw 3.3.5-11.el8 | # fftw 3.3.5-11.el8 | ||
- | yum install fftw fftw-devel | + | yum install fftw fftw-devel |
#gnu scientific libraries | #gnu scientific libraries | ||
- | yum install gsl gsl-devel | + | yum install gsl gsl-devel |
# ruby 2.5.9-109.module+el8.5.0 | # ruby 2.5.9-109.module+el8.5.0 | ||
- | yum install ruby ruby-devel | + | yum install ruby ruby-devel |
# obabel chem file formats | # obabel chem file formats | ||
- | yum install openbabel openbabel-devel | + | yum install openbabel openbabel-devel |
# compute nodes old level 3 | # compute nodes old level 3 | ||
systemctl set-default multi-user.target | systemctl set-default multi-user.target | ||
+ | |||
+ | ### centos7 so not an OpenHPC environment | ||
# other configs | # other configs | ||
+ | umount /home | ||
cd /; mv home /usr/local/ | cd /; mv home /usr/local/ | ||
mkdir /home | mkdir /home | ||
ln -s /home /share | ln -s /home /share | ||
vi /etc/passwd (/ | vi /etc/passwd (/ | ||
- | + | vi /etc/fstab | |
- | + | mount -a | |
- | # other configs | + | |
- | mv /home / | + | |
- | mkdir /home | + | |
- | ln -s /home /share | + | |
- | vi /etc/passwd | + | |
# postfix | # postfix | ||
- | dnf install postfix | + | yum install postfix mailx |
- | dnf install | + | echo " |
systemctl enable postfix | systemctl enable postfix | ||
- | echo " | + | systemctl restart |
### DONE | ### DONE | ||
- | undo vlan52, down iptables, reboot, test you can it via privs | + | undo vlan52, down iptables, reboot, |
+ | test you can get to it via private networks | ||
### REST AT HOME | ### REST AT HOME | ||
- | # or via rc.local? | ||
- | vi ifcfg-ib0 | ||
- | DEVICE=ib0 | ||
- | ONBOOT=yes | ||
- | MTU=65520 | ||
- | CONNECTED_MODE=yes | ||
- | BOOTPROTO=none | ||
- | IPADDR=10.11.103.48 | ||
- | PREFIX=16 | ||
- | mkdir /sanscratch /localscratch | + | # / |
- | chmod ugo+rwx /sanscratch /home/ | + | / |
- | chmod o+t /sanscratch /home/ | + | |
- | ln -s / | + | # if sdb present |
+ | mkdir /sanscratch /localscratch5tb | ||
+ | chmod ugo+rwx /sanscratch /localscratch5tb | ||
+ | chmod o+t /sanscratch /localscratch5tb | ||
+ | ln -s / | ||
cd /home | cd /home | ||
Line 153: | Line 168: | ||
ls -l | ls -l | ||
- | cat /sanscratch/tmp/fstab.tmp >> /etc/fstab; mkdir / | + | # ADD all the NFS mounts see greentail52: |
# fstab file mounts | # fstab file mounts | ||
- | mkdir -p /zfshomes /home66 /home33 /mindstore /opt/ | + | mkdir -p /zfshomes /home66 /home33 /mindstore /astrostore |
mkdir -p / | mkdir -p / | ||
+ | mount -a # via 10.10 | ||
# compute nodes / | # compute nodes / | ||
Line 167: | Line 182: | ||
systemctl restart chronyd | systemctl restart chronyd | ||
chronyc sources | chronyc sources | ||
- | |||
- | cat / | ||
Line 174: | Line 187: | ||
rocommunity public | rocommunity public | ||
dontLogTCPWrappersConnects yes | dontLogTCPWrappersConnects yes | ||
- | # enable, start, | + | # add to zenoss |
+ | systemctl enable snmpd | ||
+ | systemctl start snmpd | ||
# compute nodes only | # compute nodes only | ||
- | # scp fron n79:/ | + | # scp from n79:/ |
- | amber16/ | + | # amber16/ |
+ | scp -rp 10.10.102.89:/ | ||
+ | |||
+ | # copy slurm from n79 | ||
+ | scp -rp 10.10.102.89:/ | ||
+ | ln -s / | ||
+ | |||
+ | |||
+ | # backup and update passwd, shadow, group and hosts files | ||
+ | # scp from n79 or n45 | ||
+ | |||
+ | # slurm config | ||
+ | echo SLURMD_OPTIONS=" | ||
+ | mkdir / | ||
+ | chown slurm:munge / | ||
+ | mkdir / | ||
+ | chown slurm:munge / | ||
+ | # check | ||
+ | chown -R munge:munge /etc/munge / | ||
+ | chown -R slurm:munge / | ||
+ | systemctl enable munge | ||
+ | systemctl start munge | ||
+ | # test unmunge | ||
+ | / | ||
+ | # check log | ||
+ | |||
+ | # /etc/bashrc (login node) | ||
+ | export PATH=/ | ||
+ | export LD_LIBRARY_PATH=/ | ||
+ | |||
+ | # crontab | ||
+ | |||
+ | # ionice gaussian | ||
+ | 0,15,30,45 * * * * / | ||
+ | |||
+ | # cpu temps | ||
+ | 40 * * * * / | ||
+ | |||
+ | on compute node / | ||
+ | * - | ||
+ | |||
+ | |||
+ | / | ||
+ | #timing issue with munge | ||
+ | #sleep 15 | ||
+ | #/ | ||
+ | chmod +x / | ||
+ | |||
+ | # important!! put private back in place | ||
+ | systemctl disable iptables | ||
+ | systemctl stop iptables | ||
+ | reboot | ||
+ | |||
+ | # file date_ctt2.sh | ||
+ | |||
+ | # ctt /etc/pdsh | ||
+ | |||
+ | # ctt:/ | ||
+ | |||
+ | # ctt2:/ | ||
- | # Put the warewulf cluster key in authorized_keys | ||
# Put eth0 fingerprints in cottontail/ | # Put eth0 fingerprints in cottontail/ | ||
- | # add to relevant known_hosts_servername | + | |
+ | # test slurm unmunge and update slurm.conf | ||
</ | </ |