This shows you the differences between two versions of the page.
Both sides previous revision Previous revision Next revision | Previous revision Next revision Both sides next revision | ||
cluster:213 [2022/03/25 12:47] hmeij07 [Config Recipe] |
cluster:213 [2022/05/10 17:48] hmeij07 |
||
---|---|---|---|
Line 44: | Line 44: | ||
# Put the warewulf cluster key in authorized_keys | # Put the warewulf cluster key in authorized_keys | ||
+ | # Put eth0 fingerprints in cottontail/ | ||
+ | # add to relevant known_hosts_servername file | ||
# configure private subnets and ping file server | # configure private subnets and ping file server | ||
Line 81: | Line 83: | ||
dnf install gnuplot | dnf install gnuplot | ||
dnf install alpine # pico | dnf install alpine # pico | ||
+ | yum groupinstall " | ||
# other configs | # other configs | ||
Line 113: | Line 116: | ||
# on head node / | # on head node / | ||
- | allow 192.168.0.0/ | + | allow 192.168.0.0/ |
# compute nodes / | # compute nodes / | ||
#pool 2.pool.ntp.org iburst | #pool 2.pool.ntp.org iburst | ||
Line 120: | Line 123: | ||
# check | # check | ||
chronyc sources | chronyc sources | ||
+ | |||
+ | |||
+ | # on head node install from epel repo | ||
+ | yum install slurm-openlava | ||
+ | # error on conflicting libs, too bad! | ||
Line 134: | Line 142: | ||
yum install cmake -y | yum install cmake -y | ||
yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | yum install libjpeg libjpeg-devel libjpeg-turbo-devel -y | ||
- | # amber | + | |
+ | #easybuild | ||
+ | yum install libibvers libibverbs-devel | ||
+ | |||
+ | # amber20 cmake readline error fix needs | ||
+ | yum install ncurses-c++-libs-6.1-9.20180224.el8.x86_64.rpm \ | ||
+ | ncurses-devel-6.1-9.20180224.el8.x86_64.rpm \ | ||
+ | readline-devel-7.0-10.el8.x86_64.rpm | ||
+ | |||
+ | # amber20 | ||
yum -y install tcsh make \ | yum -y install tcsh make \ | ||
gcc gcc-gfortran gcc-c++ \ | gcc gcc-gfortran gcc-c++ \ | ||
Line 170: | Line 187: | ||
# python v 3.9 | # python v 3.9 | ||
yum install python39 python39-devel | yum install python39 python39-devel | ||
+ | ln -s / | ||
# fftw 3.3.5-11.el8 | # fftw 3.3.5-11.el8 | ||
yum install fftw fftw-devel | yum install fftw fftw-devel | ||
Line 216: | Line 234: | ||
libhwloc.so.15 => / | libhwloc.so.15 => / | ||
- | # add to zenoss | + | # add to zenoss |
+ | rocommunity public | ||
+ | dontLogTCPWrappersConnects yes | ||
</ | </ | ||
Line 232: | Line 252: | ||
\\ | \\ | ||
+ | ==== Amber20 ==== | ||
+ | OpenHPC | ||
+ | |||
+ | < | ||
+ | |||
+ | | ||
+ | 989 tar xvfj ../ | ||
+ | 993 cd amber20_src/ | ||
+ | 994 cd build/ | ||
+ | 996 vi run_cmake | ||
+ | |||
+ | # Assume this is Linux: | ||
+ | |||
+ | # serial, do on heasd node, pull down miniconda, compile, install | ||
+ | cmake $AMBER_PREFIX/ | ||
+ | -DCMAKE_INSTALL_PREFIX=/ | ||
+ | -DCOMPILER=GNU | ||
+ | -DMPI=FALSE -DCUDA=FALSE -DINSTALL_TESTS=TRUE \ | ||
+ | -DDOWNLOAD_MINICONDA=TRUE -DMINICONDA_USE_PY3=TRUE \ | ||
+ | 2>&1 | tee cmake.log | ||
+ | |||
+ | # Env | ||
+ | |||
+ | [hmeij@n100 ~]$ module load cuda/11.6 | ||
+ | |||
+ | [hmeij@n100 ~]$ echo $CUDA_HOME | ||
+ | / | ||
+ | |||
+ | [hmeij@n100 ~]$ which nvcc mpicc gcc | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | |||
+ | # [FIXED} cmake error on conda install, set to FALSE | ||
+ | # OS native python, install on n[100-101] | ||
+ | -- Python version 3.9 -- OK | ||
+ | -- Found PythonLibs: / | ||
+ | -- Checking for Python package numpy -- not found | ||
+ | -- Checking for Python package scipy -- not found | ||
+ | -- Checking for Python package matplotlib -- not found | ||
+ | -- Checking for Python package setuptools -- found | ||
+ | [END FIXED] | ||
+ | |||
+ | # mpi & cuda FALSE builds serial | ||
+ | ./run_cmake | ||
+ | make install | ||
+ | # lots and lots of warnings | ||
+ | |||
+ | # then | ||
+ | source / | ||
+ | |||
+ | # on n100 now, parallel, set miniconda flags to FALSE | ||
+ | -MPI=TRUE | ||
+ | ./run_cmake | ||
+ | make install | ||
+ | |||
+ | # on n100 just change cuda flag | ||
+ | -CUDA=TRUE | ||
+ | ./run_cmake | ||
+ | make install | ||
+ | |||
+ | #tests | ||
+ | cd $AMBERHOME | ||
+ | make test.serial | ||
+ | export DO_PARALLEL=" | ||
+ | make test.parallel | ||
+ | export CUDA_VISIBLE_DEVICES=0 | ||
+ | make test.cuda.serial | ||
+ | make test.cuda.parallel | ||
+ | |||
+ | </ | ||
**[[cluster: | **[[cluster: | ||