cluster:224
Differences
This shows you the differences between two versions of the page.
| Both sides previous revision / Previous revision / Next revision | Previous revision | ||
| cluster:224 [2023/10/13 13:57] – hmeij07 | cluster:224 [2024/01/12 14:36] (current) – hmeij07 | ||
|---|---|---|---|
| Line 7: | Line 7: | ||
| < | < | ||
| + | |||
| + | # first step | ||
| + | yum update -y # get to the latest | ||
| + | reboot | ||
| # IP ranges | # IP ranges | ||
| Line 12: | Line 16: | ||
| 10.10.102.48 n38-eth1 | 10.10.102.48 n38-eth1 | ||
| 10.11.103.48 n38-ib0 | 10.11.103.48 n38-ib0 | ||
| + | DEFROUTE=yes # others no | ||
| + | GATEWAY=192, | ||
| cd / | cd / | ||
| vi ifcfg-eth0 # 192.168.102.x | vi ifcfg-eth0 # 192.168.102.x | ||
| vi ifcfg-eth1 # 10.10.102.x | vi ifcfg-eth1 # 10.10.102.x | ||
| + | |||
| + | # or via rc.local? see n102 | ||
| + | vi ifcfg-ib0 | ||
| + | DEVICE=ib0 | ||
| + | ONBOOT=yes | ||
| + | MTU=65520 | ||
| + | CONNECTED_MODE=yes | ||
| + | BOOTPROTO=none | ||
| + | IPADDR=10.11.103.48 | ||
| + | PREFIX=16 | ||
| + | # check with ibstat | ||
| + | Port 1: | ||
| + | State: Active | ||
| + | Physical state: LinkUp | ||
| + | # check with ethtool ib0 | ||
| + | Speed: 40000Mb/s | ||
| # root: sync cottontail' | # root: sync cottontail' | ||
| ssh-keygen -t rsa | ssh-keygen -t rsa | ||
| - | scp 10.10.102.253:/ | + | scp 10.10.102.250:/ |
| / | / | ||
| vi / | vi / | ||
| Line 71: | Line 93: | ||
| yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | ||
| - | #easybuild | + | # check first |
| - | yum install | + | systemctl status rdma # loaded/ |
| + | rpm -qa | egrep " | ||
| + | # no # yum groupinstall " | ||
| + | yum install libibverbs-devel | ||
| # amber20 cmake readline error fix needs | # amber20 cmake readline error fix needs | ||
| - | yum install | + | yum install ncurses-devel readline-devel -y |
| - | | + | |
| - | | + | |
| # amber20 | # amber20 | ||
| Line 89: | Line 112: | ||
| # FINISH native vanilla installs | # FINISH native vanilla installs | ||
| # R version 4.1.2 (2021-11-01) -- "Bird Hippie" | # R version 4.1.2 (2021-11-01) -- "Bird Hippie" | ||
| - | yum install R R-devel | + | yum install R R-devel |
| # openjdk version " | # openjdk version " | ||
| - | rpm -qa | grep ^java # check | + | rpm -qa | grep ^java # check, else |
| yum install java-1.8.0-openjdk java-1.8.0-openjdk-devel \ | yum install java-1.8.0-openjdk java-1.8.0-openjdk-devel \ | ||
| - | java-1.8.0-openjdk-headless | + | java-1.8.0-openjdk-headless |
| - | # python v 3.9 | + | # python v 2.7.5 |
| - | yum install python39 python39-devel | + | |
| - | ln -s / | + | |
| # fftw 3.3.5-11.el8 | # fftw 3.3.5-11.el8 | ||
| - | yum install fftw fftw-devel | + | yum install fftw fftw-devel |
| #gnu scientific libraries | #gnu scientific libraries | ||
| - | yum install gsl gsl-devel | + | yum install gsl gsl-devel |
| # ruby 2.5.9-109.module+el8.5.0 | # ruby 2.5.9-109.module+el8.5.0 | ||
| - | yum install ruby ruby-devel | + | yum install ruby ruby-devel |
| # obabel chem file formats | # obabel chem file formats | ||
| - | yum install openbabel openbabel-devel | + | yum install openbabel openbabel-devel |
| # compute nodes old level 3 | # compute nodes old level 3 | ||
| systemctl set-default multi-user.target | systemctl set-default multi-user.target | ||
| + | |||
| + | ### centos7 so not an OpenHPC environment | ||
| # other configs | # other configs | ||
| + | umount /home | ||
| cd /; mv home /usr/local/ | cd /; mv home /usr/local/ | ||
| mkdir /home | mkdir /home | ||
| ln -s /home /share | ln -s /home /share | ||
| vi /etc/passwd (/ | vi /etc/passwd (/ | ||
| - | + | vi /etc/fstab | |
| - | + | mount -a | |
| - | # other configs | + | |
| - | mv /home / | + | |
| - | mkdir /home | + | |
| - | ln -s /home /share | + | |
| - | vi /etc/passwd | + | |
| # postfix | # postfix | ||
| - | dnf install postfix | + | yum install postfix mailx |
| - | dnf install | + | echo " |
| systemctl enable postfix | systemctl enable postfix | ||
| - | echo " | + | systemctl restart |
| ### DONE | ### DONE | ||
| - | undo vlan52, down iptables, reboot, test you can it via privs | + | undo vlan52, down iptables, reboot, |
| + | test you can get to it via private networks | ||
| ### REST AT HOME | ### REST AT HOME | ||
| - | # or via rc.local? | ||
| - | vi ifcfg-ib0 | ||
| - | DEVICE=ib0 | ||
| - | ONBOOT=yes | ||
| - | MTU=65520 | ||
| - | CONNECTED_MODE=yes | ||
| - | BOOTPROTO=none | ||
| - | IPADDR=10.11.103.48 | ||
| - | PREFIX=16 | ||
| - | mkdir /sanscratch /localscratch | + | # / |
| - | chmod ugo+rwx /sanscratch /home/ | + | / |
| - | chmod o+t /sanscratch /home/ | + | |
| - | ln -s / | + | # if sdb present |
| + | mkdir /sanscratch /localscratch5tb | ||
| + | chmod ugo+rwx /sanscratch /localscratch5tb | ||
| + | chmod o+t /sanscratch /localscratch5tb | ||
| + | ln -s / | ||
| cd /home | cd /home | ||
| Line 153: | Line 168: | ||
| ls -l | ls -l | ||
| - | cat /sanscratch/tmp/fstab.tmp >> /etc/fstab; mkdir / | + | # ADD all the NFS mounts see greentail52: |
| # fstab file mounts | # fstab file mounts | ||
| - | mkdir -p /zfshomes /home66 /home33 /mindstore /opt/ | + | mkdir -p /zfshomes /home66 /home33 /mindstore /astrostore |
| mkdir -p / | mkdir -p / | ||
| + | mount -a # via 10.10 | ||
| # compute nodes / | # compute nodes / | ||
| Line 167: | Line 182: | ||
| systemctl restart chronyd | systemctl restart chronyd | ||
| chronyc sources | chronyc sources | ||
| - | |||
| - | cat / | ||
| Line 174: | Line 187: | ||
| rocommunity public | rocommunity public | ||
| dontLogTCPWrappersConnects yes | dontLogTCPWrappersConnects yes | ||
| - | # enable, start, | + | # add to zenoss |
| + | systemctl enable snmpd | ||
| + | systemctl start snmpd | ||
| # compute nodes only | # compute nodes only | ||
| - | # scp fron n79:/ | + | # scp from n79:/ |
| - | amber16/ | + | # amber16/ |
| + | scp -rp 10.10.102.89:/ | ||
| + | |||
| + | # copy slurm from n79 | ||
| + | scp -rp 10.10.102.89:/ | ||
| + | ln -s / | ||
| + | |||
| + | |||
| + | # backup and update passwd, shadow, group and hosts files | ||
| + | # scp from n79 or n45 | ||
| + | |||
| + | # slurm config | ||
| + | echo SLURMD_OPTIONS=" | ||
| + | mkdir / | ||
| + | chown slurm:munge / | ||
| + | mkdir / | ||
| + | chown slurm:munge / | ||
| + | # check | ||
| + | chown -R munge:munge /etc/munge / | ||
| + | chown -R slurm:munge / | ||
| + | systemctl enable munge | ||
| + | systemctl start munge | ||
| + | # test unmunge | ||
| + | / | ||
| + | # check log | ||
| + | |||
| + | # /etc/bashrc (login node) | ||
| + | export PATH=/ | ||
| + | export LD_LIBRARY_PATH=/ | ||
| + | |||
| + | # crontab | ||
| + | |||
| + | # ionice gaussian | ||
| + | 0,15,30,45 * * * * / | ||
| + | |||
| + | # cpu temps | ||
| + | 40 * * * * / | ||
| + | |||
| + | on compute node / | ||
| + | * - | ||
| + | |||
| + | |||
| + | / | ||
| + | #timing issue with munge | ||
| + | #sleep 15 | ||
| + | #/ | ||
| + | chmod +x / | ||
| + | |||
| + | # important!! put private back in place | ||
| + | systemctl disable iptables | ||
| + | systemctl stop iptables | ||
| + | reboot | ||
| + | |||
| + | # file date_ctt2.sh | ||
| + | |||
| + | # ctt /etc/pdsh | ||
| + | |||
| + | # ctt:/ | ||
| + | |||
| + | # ctt2:/ | ||
| - | # Put the warewulf cluster key in authorized_keys | ||
| # Put eth0 fingerprints in cottontail/ | # Put eth0 fingerprints in cottontail/ | ||
| - | # add to relevant known_hosts_servername | + | |
| + | # test slurm unmunge and update slurm.conf | ||
| </ | </ | ||
cluster/224.1697205477.txt.gz · Last modified: 2023/10/13 13:57 by hmeij07
