cluster:209
Differences
This shows you the differences between two versions of the page.
| Both sides previous revisionPrevious revisionNext revision | Previous revision | ||
| cluster:209 [2021/11/02 13:32] – hmeij07 | cluster:209 [2022/04/10 19:49] (current) – [OHPC] hmeij07 | ||
|---|---|---|---|
| Line 10: | Line 10: | ||
| * https:// | * https:// | ||
| * https:// | * https:// | ||
| + | * https:// | ||
| + | |||
| + | **NOTE** this eats up lots of disk space with multiple compiler and tool chains as you will see, hence installed in / | ||
| < | < | ||
| Line 109: | Line 112: | ||
| # yumdownloader --destdir=somewhere | # yumdownloader --destdir=somewhere | ||
| # centos 7 nodes only | # centos 7 nodes only | ||
| - | cd / | + | cd / |
| + | rpm -ivh environment-modules-3.2.10-10.el7.x86_64.rpm \ | ||
| rpm -ivh lua-filesystem-1.6.2-2.el7.x86_64.rpm \ | rpm -ivh lua-filesystem-1.6.2-2.el7.x86_64.rpm \ | ||
| lua-json-1.3.2-2.el7.noarch.rpm \ | lua-json-1.3.2-2.el7.noarch.rpm \ | ||
| Line 116: | Line 120: | ||
| lua-bitop-1.0.2-3.el7.x86_64.rpm \ | lua-bitop-1.0.2-3.el7.x86_64.rpm \ | ||
| lua-lpeg-0.12-1.el7.x86_64.rpm | lua-lpeg-0.12-1.el7.x86_64.rpm | ||
| - | Lmod-8.2.7-1.el7.x86_64.rpm | + | Lmod-8.2.7-1.el7.x86_64.rpm |
| # log out and log back in | # log out and log back in | ||
| # end sidebar | # end sidebar | ||
| Line 125: | Line 129: | ||
| # example easybuild installation of software | # example easybuild installation of software | ||
| - | eb Bowtie2-2.4.2-GCC-9.3.0.eb --dry-run --robot --prefix=/share/apps/ | + | eb Bowtie2-2.4.2-GCC-9.3.0.eb --dry-run --robot --prefix=/sanscratch/ |
| # do not forget prefix else it goes to $HOME/ | # do not forget prefix else it goes to $HOME/ | ||
| # once done | # once done | ||
| - | module use /share/apps/ | + | module use /sanscratch/ |
| # use ' | # use ' | ||
| Line 145: | Line 149: | ||
| [hmeij@greentail52 ~]$ which bowtie2 | [hmeij@greentail52 ~]$ which bowtie2 | ||
| - | /share/apps/ | + | /sanscratch/ |
| </ | </ | ||
| Line 155: | Line 159: | ||
| # this required libibverbs and libibverbs-devel so not sure it will run on compute nodes | # this required libibverbs and libibverbs-devel so not sure it will run on compute nodes | ||
| - | eb astropy-4.2.1-intelcuda-2020b.eb | + | eb astropy-4.2.1-intelcuda-2020b.eb |
| # then ran into icc license problems, 2020b, check out license failed | # then ran into icc license problems, 2020b, check out license failed | ||
| Line 161: | Line 165: | ||
| # hint add eula flag when trying i/intel toolchain | # hint add eula flag when trying i/intel toolchain | ||
| eb intel-2021a.eb | eb intel-2021a.eb | ||
| - | --prefix=/share/apps/ | + | --prefix=/sanscratch/ |
| --accept-eula-for=Intel-oneAPI, | --accept-eula-for=Intel-oneAPI, | ||
| # built intel-compilers/ | # built intel-compilers/ | ||
| Line 184: | Line 188: | ||
| description = """ | description = """ | ||
| - | # to find config change to that location | + | # to find config, change to that location |
| - | cd easybuild/ | + | # and you must set python 3.8.3 as indicated above, else run.py from |
| - | astropy]$ | + | # native OS python is found yielding 'make -j 16' error |
| + | |||
| + | cd easybuild/ | ||
| + | eb astropy-4.2.1-fosscuda-2020b.eb | ||
| + | --dry-run --robot --prefix=/ | ||
| # fosscuda attempt worked, see below for continuation | # fosscuda attempt worked, see below for continuation | ||
| Line 219: | Line 227: | ||
| 12) hwloc/ | 12) hwloc/ | ||
| - | # in our environment | + | # in our environment |
| + | export LD_LIBRARY_PATH=/ | ||
| [hmeij@greentail52 ~]$ which python nvcc mpirun | [hmeij@greentail52 ~]$ which python nvcc mpirun | ||
| Line 243: | Line 252: | ||
| [hmeij@n84 ~]$ module list | [hmeij@n84 ~]$ module list | ||
| ... | ... | ||
| + | |||
| + | </ | ||
| + | |||
| + | Helios GPU tutorial\\ | ||
| + | https:// | ||
| + | < | ||
| + | # pycuda not working, why would fosscuda? | ||
| + | ImportError: | ||
| + | undefined symbol: cuDevicePrimaryCtxRelease_v2 | ||
| + | </ | ||
| + | https:// | ||
| + | |||
| + | ===== Emcee ===== | ||
| + | |||
| + | < | ||
| + | |||
| + | module list | ||
| + | |||
| + | Currently Loaded Modules: | ||
| + | 1) GCCcore/ | ||
| + | 2) zlib/ | ||
| + | 3) binutils/ | ||
| + | 4) GCC/ | ||
| + | 5) numactl/ | ||
| + | 6) XZ/ | ||
| + | 7) libxml2/ | ||
| + | 8) libpciaccess/ | ||
| + | 9) hwloc/ | ||
| + | 10) OpenMPI/ | ||
| + | 11) OpenBLAS/ | ||
| + | 12) gompi/ | ||
| + | 13) FFTW/ | ||
| + | |||
| + | </ | ||
| + | |||
| + | I noticed emcee loaded two python versions, the default being 3.7.2 (requires centos7). But you can unload this python module and load module Python/ | ||
| + | |||
| + | Flexible but weird. | ||
| + | |||
| + | ===== PyCUDA ===== | ||
| + | |||
| + | < | ||
| + | |||
| + | [hmeij@greentail52 ~]$ module load PyCUDA/ | ||
| + | [hmeij@greentail52 ~]$ module list | ||
| + | |||
| + | Currently Loaded Modules: | ||
| + | 1) GCCcore/ | ||
| + | 2) zlib/ | ||
| + | 3) binutils/ | ||
| + | 4) GCC/ | ||
| + | 5) CUDAcore/ | ||
| + | 6) CUDA/ | ||
| + | 7) gcccuda/ | ||
| + | 8) numactl/ | ||
| + | 9) XZ/ | ||
| + | 10) libxml2/ | ||
| + | 11) libpciaccess/ | ||
| + | 12) hwloc/ | ||
| + | 13) libevent/ | ||
| + | 14) Check/ | ||
| + | 15) GDRCopy/ | ||
| + | 16) UCX/ | ||
| + | 17) libfabric/ | ||
| + | 18) PMIx/ | ||
| + | 19) OpenMPI/ | ||
| + | |||
| + | # same error as pycuda inside of astropy module | ||
| + | ImportError: | ||
| </ | </ | ||
| Line 301: | Line 379: | ||
| ... | ... | ||
| + | |||
| + | ===== OHPC ===== | ||
| + | |||
| + | Load module, search for application, | ||
| + | |||
| + | Then remove the dry-run flag. | ||
| + | |||
| + | < | ||
| + | |||
| + | | ||
| + | which eb | ||
| + | |||
| + | eb --search PyCUDA | ||
| + | find / | ||
| + | -name PyCUDA* | ||
| + | |||
| + | # dry-run | ||
| + | eb \ | ||
| + | / | ||
| + | easybuild/ | ||
| + | | ||
| + | |||
| + | [hmeij@cottontail2 ~]$ module list | ||
| + | |||
| + | Currently Loaded Modules: | ||
| + | 1) autotools | ||
| + | 2) prun/ | ||
| + | |||
| + | |||
| + | |||
| + | [hmeij@cottontail2 ~]$ module load PyCUDA/ | ||
| + | |||
| + | The following have been reloaded with a version change: | ||
| + | 1) hwloc/2.5.0 => hwloc/ | ||
| + | |||
| + | [hmeij@cottontail2 ~]$ module list | ||
| + | |||
| + | Currently Loaded Modules: | ||
| + | 1) autotools | ||
| + | 2) prun/ | ||
| + | 3) gnu9/ | ||
| + | 4) ucx/ | ||
| + | 5) openmpi4/ | ||
| + | 6) ohpc 28) FFTW/ | ||
| + | 7) GCCcore/ | ||
| + | 8) zlib/ | ||
| + | 9) binutils/ | ||
| + | 10) GCC/ | ||
| + | 11) CUDAcore/ | ||
| + | 12) CUDA/ | ||
| + | 13) gcccuda/ | ||
| + | 14) numactl/ | ||
| + | 15) XZ/ | ||
| + | 16) libxml2/ | ||
| + | 17) libpciaccess/ | ||
| + | 18) hwloc/ | ||
| + | 19) libevent/ | ||
| + | 20) Check/ | ||
| + | 21) GDRCopy/ | ||
| + | 22) UCX/ | ||
| + | |||
| + | |||
| + | |||
| + | [hmeij@cottontail2 ~]$ which gcc mpicc nvcc python | ||
| + | / | ||
| + | / | ||
| + | / | ||
| + | / | ||
| + | |||
| + | # look at the OHPC software page for a sample pycuda gpu " | ||
| + | |||
| + | </ | ||
cluster/209.1635859921.txt.gz · Last modified: by hmeij07
