Skip to content
Snippets Groups Projects
douar.run.mahone 1.91 KiB
Newer Older
  • Learn to ignore specific revisions
  • Douglas Guptill's avatar
    Douglas Guptill committed
    #!/bin/sh
    #
    # run douar, on mahone
    #
    # Author: Douglas Guptill
    # 2009-06-03: new, from a copy of the one on p690
    
    # Create a directory unless it already exists.
    #
    # Arguments: $1 - path of the directory to create.  The path is quoted, so
    #                 it may contain spaces; missing parent directories are
    #                 created as well (mkdir -p).
    # Returns:   0 if the directory already existed or was created,
    #            otherwise the non-zero status of mkdir.
    make_dir() {
      if ! test -d "$1"; then
        mkdir -p -- "$1"
      fi
    }
    
    # The process count is the one required argument.
    # A usage error is reported on stderr and ends the script with a non-zero
    # status, so that whatever launched the script can tell it did not run.
    if test $# -lt 1 ; then
      echo "Usage: $0 <number-of-processors>" >&2
      exit 1
    fi

    # The value is handed verbatim to "mpirun -np" further down, so reject
    # anything that is empty or contains a non-digit before going any further.
    case $1 in
      ''|*[!0-9]*)
        echo "$0: number of processors must be a whole number, got '$1'" >&2
        echo "Usage: $0 <number-of-processors>" >&2
        exit 1
        ;;
    esac

    PROCS=$1
    echo "Will use ${PROCS} processes."
    
    # For wsmp
    export MALLOC_TRIM_THRESHOLD_=-1
    export MALLOC_MMAP_MAX_=0
    # WSMP needs to know where its license file is.
    # (But this doesn't seem to work yet....)
    # It looks like the license must be where we start the job.
    # When using the license from AIX, we get:
    #        ERROR**:  This License is registered for an AIX system
    # export WSMPLICPATH=/home/dguptill/software/wsmp/
    # export WSMPLICPATH=/home/pfullsac/PROGRAMS2008/v0.1/run_test_all/pbwithlic/wsmp.lic
    # The PGPLOT routines need this.
    export PGPLOT_DIR=/home/dguptill/software/pgplot-5.2.2
    # Prepend PGPLOT_DIR to the library search path.  The ":" separator is only
    # added when LD_LIBRARY_PATH already has a value: a trailing ":" would leave
    # an empty path element, which the dynamic loader treats as the current
    # working directory.
    export LD_LIBRARY_PATH="${PGPLOT_DIR}${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"
    echo  "LD_LIBRARY_PATH is ${LD_LIBRARY_PATH}"
    # Make sure the directories douar needs are present, relative to the
    # directory the script is started from.  DEBUG is listed before
    # DEBUG/mpilogs so the parent exists first.
    for dir in DEBUG DEBUG/mpilogs OUT; do
      make_dir "${dir}"
    done
    # Location of the douar executable.
    # Alternative build, currently not used:
    # BIN=/home/dguptill/software/douar/bin/douar.mpich.02
    BIN=/home/dguptill/software/douar/douar
    
    # Assemble the command line used to launch douar under MPI.
    #
    # Earlier variants, kept for reference:
    # COM="mpirun -np ${PROCS} --host localhost,localhost,localhost,localhost --byslot ${BIN}"
    # COM="/usr/local/mpich.pgi.64/bin/mpirun -machinefile /home/dguptill/douar/machinefile -np ${PROCS} ${BIN}"
    #
    # Notes for the head node and MPICH -- trouble that was seen:
    #p0_15929:  p4_error: Child process exited while making connection to remote process on cl003: 0
    #p0_15929: (6.230469) net_send: could not write to fd=5, errno = 32
    #
    # The launcher and the run directory are named once and reused below; the
    # resulting COM string is a single space-separated command line.
    MPIRUN=/usr/local/mpich.pgi.64/bin/mpirun
    RUN_DIR=/home/dguptill/douar
    COM="${MPIRUN} -arch LINUX -machinefile ${RUN_DIR}/machinefile -np ${PROCS} ${BIN} ${RUN_DIR}/input.txt"
    echo "COM is <${COM}>"
    
    # start douar and go away....
    #
    # nohup ${COM} &
    # echo "douar has been started.  Look in nohup.out ."

    # start douar and watch it........
    #
    # Standard output of the run is shown on the terminal and appended to
    # ${OUT}; standard error is written to douar.err.
    #
    # A plain "${COM} | tee" pipeline reports the exit status of tee, so a
    # failed run would still end the script with status 0.  /bin/sh has no
    # portable "pipefail", so the status of the run is passed out of the
    # pipeline on file descriptor 4 and captured by the command substitution,
    # while file descriptor 3 keeps a copy of the real standard output for tee.
    # ${COM} is deliberately left unquoted: it holds a whole command line that
    # must be split into words.
    OUT=douar.out
    exec 3>&1
    STATUS=$(
      {
        { ${COM} 2>douar.err 3>&- 4>&-; echo "$?" >&4; } |
          tee -a "${OUT}" >&3 3>&- 4>&-
      } 4>&1
    )
    exec 3>&-
    # Finish with the status of the run itself (1 if it could not be captured).
    exit "${STATUS:-1}"