This shows you the differences between two versions of the page.
Both sides previous revision Previous revision Next revision | Previous revision | ||
cluster:119 [2013/09/20 19:16] hmeij [gromacs.sub] |
cluster:119 [2021/06/17 19:32] (current) hmeij07 |
||
---|---|---|---|
Line 1: | Line 1: | ||
\\ | \\ | ||
**[[cluster: | **[[cluster: | ||
- | |||
- | Jobs need to be submitted to the scheduler on host sharptail itself for now and will be dispatched to nodes n33-n37 in queue mwgpu. | ||
- | --- // | ||
==== Submitting GPU Jobs ==== | ==== Submitting GPU Jobs ==== | ||
+ | |||
+ | Please leave plenty of time between multiple GPU job submissions. | |||
+ | |||
+ | Jobs need to be submitted to the scheduler via cottontail to queues mwgpu, amber128, exx96. | ||
+ | |||
+ | This page is old, the gpu resource '' | ||
+ | --- // | ||
+ | |||
+ | **Articles** | ||
+ | |||
+ | * [[http:// | ||
+ | * [[http:// | ||
+ | |||
Line 44: | Line 54: | ||
</ | </ | ||
- | With '' | + | With '' |
< | < | ||
Line 58: | Line 68: | ||
3 Tesla K20m 21 C 0 % | 3 Tesla K20m 21 C 0 % | ||
==================================================== | ==================================================== | ||
+ | |||
+ | [hmeij@sharptail sharptail]$ ssh n33 gpu-free | ||
+ | 1,3,0 | ||
+ | |||
+ | |||
</ | </ | ||
Line 121: | Line 136: | ||
#BSUB -q mwgpu | #BSUB -q mwgpu | ||
#BSUB -J test | #BSUB -J test | ||
+ | |||
+ | # from greentail we need to set up the module env | ||
+ | export PATH=/ | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | export LD_LIBRARY_PATH=/ | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | |||
## leave sufficient time between job submissions (30-60 secs) | ## leave sufficient time between job submissions (30-60 secs) | ||
Line 215: | Line 246: | ||
##BSUB -q mwgpu | ##BSUB -q mwgpu | ||
##BSUB -n 1 | ##BSUB -n 1 | ||
- | ##BSUB -R " | + | ##BSUB -R " |
## signal GMXRC is a gpu run with: 1=thread_mpi | ## signal GMXRC is a gpu run with: 1=thread_mpi | ||
#export GMXRC=1 | #export GMXRC=1 | ||
Line 226: | Line 257: | ||
#BSUB -q mwgpu | #BSUB -q mwgpu | ||
#BSUB -n 1 | #BSUB -n 1 | ||
- | #BSUB -R " | + | #BSUB -R " |
# signal GMXRC is a gpu run with: 2=mvapich2 | # signal GMXRC is a gpu run with: 2=mvapich2 | ||
export GMXRC=2 | export GMXRC=2 | ||
Line 236: | Line 267: | ||
</ | </ | ||
+ | |||
+ | ==== matlab.sub ==== | ||
+ | |||
+ | < | ||
+ | |||
+ | #!/bin/bash | ||
+ | |||
+ | rm -rf out err *.out | ||
+ | |||
+ | # from greentail we need to recreate module env | ||
+ | export PATH=/ | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | export PATH=/ | ||
+ | export LD_LIBRARY_PATH=/ | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | / | ||
+ | |||
+ | #BSUB -o out | ||
+ | #BSUB -e err | ||
+ | #BSUB -N | ||
+ | #BSUB -J test | ||
+ | |||
+ | # GPU RUN: (1-4), queue mwgpu, n (1-4, matches gpu count), must run on one node | ||
+ | #BSUB -q mwgpu | ||
+ | #BSUB -n 1 | ||
+ | #BSUB -R " | ||
+ | # signal MATGPU is a gpu run | ||
+ | export MATGPU=1 | ||
+ | lava.mvapich2.wrapper matlab -nodisplay | ||
+ | |||
+ | |||
+ | </ | ||
+ | |||
==== lava.mvapich2.wrapper ==== | ==== lava.mvapich2.wrapper ==== | ||
Line 362: | Line 434: | ||
fi | fi | ||
+ | elif [ -n " | ||
+ | echo " | ||
+ | ${MYARGS} | ||
elif [ -n " | elif [ -n " | ||
cat ${MACHFILE}.lst | tr '\/ ' ' | cat ${MACHFILE}.lst | tr '\/ ' ' | ||
Line 372: | Line 447: | ||
exit $? | exit $? | ||
+ | |||
+ | |||
+ | </ | ||
+ | |||
+ | |||
+ | ===== elim code ===== | ||
+ | |||
+ | < | ||
+ | |||
+ | # | ||
+ | |||
+ | while (1) { | ||
+ | |||
+ | $gpu = 0; | ||
+ | $log = ''; | ||
+ | if (-e "/ | ||
+ | $tmp = `/ | ||
+ | @tmp = split(/ | ||
+ | foreach $i (0..$#tmp) { | ||
+ | ($a, | ||
+ | if ( $f == 0 ) { $gpu = $gpu + 1; } | ||
+ | #print "$a $f $gpu\n"; | ||
+ | $log .= " | ||
+ | } | ||
+ | } | ||
+ | # nr_of_args name1 value1 | ||
+ | $string = "1 gpu $gpu"; | ||
+ | |||
+ | $h = `hostname`; chop($h); | ||
+ | $d = `date +%m/ | ||
+ | foreach $i (' | ||
+ | if ( " | ||
+ | `echo " | ||
+ | } | ||
+ | } | ||
+ | |||
+ | # you need the \n to flush -hmeij | ||
+ | # you also need the space before the line feed -hmeij | ||
+ | print " | ||
+ | # or use | ||
+ | # | ||
+ | |||
+ | # smaller than specified in lsf.shared | ||
+ | sleep 10; | ||
+ | |||
+ | } | ||