Ignore:
Timestamp:
Dec 14, 2010 1:33:02 PM (14 years ago)
Author:
raasch
Message:

mrun/mbuild/subjob adjustments for new Tsubame system at Tokyo Institute of Technology (lctit)

File:
1 edited

Legend:

Unmodified
Added
Removed
  • palm/trunk/SCRIPTS/mrun

    r622 r635  
    213213     #                     has now argument threads_per_task
    214214     #                     adjustments for Kyushu Univ. (lcrte, ibmku)
     215     # 14/12/10 - Siggi  - adjustments for new Tsubame system at Tokyo
     216     #                     institute of technology (lctit)
    215217
    216218
     
    662664    do_remote=true
    663665    case  $host  in
    664         (ibm|ibmh|ibmku|ibms|ibmy|nech|necriam|lckyoto|lcsgib|lcsgih|lctit|unics|lcxt4|lcxt5m|lck)  true;;
     666        (ibm|ibmh|ibmku|ibms|ibmy|nech|necriam|lckyoto|lcsgib|lcsgih|unics|lcxt4|lcxt5m|lck)  true;;
    665667        (*)  printf "\n"
    666668             printf "\n  +++ sorry: execution of batch jobs on remote host \"$host\""
     
    839841                   do_remote=true
    840842                   case  $host  in
    841                        (ibm|ibmh|ibmku|ibms|ibmy|lckyoto|lcsgib|lcsgih|lctit|nech|necriam|unics|lcxt4|lcxt5m|lck)  true;;
     843                       (ibm|ibmh|ibmku|ibms|ibmy|lckyoto|lcsgib|lcsgih|nech|necriam|unics|lcxt4|lcxt5m|lck)  true;;
    842844                       (*)  printf "\n  +++ sorry: execution of batch jobs on remote host \"$host\""
    843845                            printf "\n      is not available"
     
    11211123    do_remote=true
    11221124    case  $host  in
    1123         (ibm|ibmh|ibmku|ibms|ibmy|lckyoto|lcsgib|lcsgih|lctit|nech|necriam|unics|lcxt4|lcxt5m|lck)  true;;
     1125        (ibm|ibmh|ibmku|ibms|ibmy|lckyoto|lcsgib|lcsgih|nech|necriam|unics|lcxt4|lcxt5m|lck)  true;;
    11241126        (*)  printf "\n"
    11251127             printf "\n  +++ sorry: execution of batch jobs on remote host \"$host\""
     
    12081210       then
    12091211          node_usage=shared
    1210        elif [[ $host = lctit ]]
    1211        then
    1212           node_usage=RAM64GB
    12131212       elif [[ $(echo $host | cut -c1-5) = lcsgi ]]
    12141213       then
     
    12191218    fi
    12201219
    1221     if [[ $node_usage != shared  &&  $node_usage != not_shared  &&  $node_usage != singlejob  &&  "$(echo $node_usage | cut -c1-3)" != "sla"  &&  $node_usage != RAM64GB  ]]
     1220    if [[ $node_usage != shared  &&  $node_usage != not_shared  &&  $node_usage != singlejob  &&  "$(echo $node_usage | cut -c1-3)" != "sla" ]]
    12221221    then
    12231222       printf "\n"
     
    12701269        (lcsgib)     queue=bigq;;
    12711270        (lcsgih)     queue=bigq;;
    1272         (lctit)      queue=RAM64GB;;
     1271        (lctit)      queue=S;;
    12731272        (nech)       queue=none;;
    12741273        (necriam)    queue=SP;;
     
    19671966
    19681967    # JOBMODUS FESTSTELLEN
    1969  if [[ "$ENVIRONMENT" = BATCH  &&  $localhost != lctit  ||  "$QUEUE" != interactive  &&  $localhost = lctit ]]
     1968 if [[ "$ENVIRONMENT" = BATCH ]]
    19701969 then
    19711970    jobmo=BATCH
    19721971 else
    19731972    jobmo=INTERACTIVE
     1973 fi
     1974
     1975
     1976    # no interactive runs on lctit
     1977 if [[ $host = lctit  &&  $jobmo = INTERACTIVE  &&  $do_batch = false ]]
     1978 then
     1979    printf "\n  +++ no interactive runs allowed on host \"$host\" "
     1980    printf "\n      please submit batch job using mrun option \"-b\" \n"
     1981    locat=normal; exit
    19741982 fi
    19751983
     
    25332541          continue   # ANDERENFALLS IST STATUS=1, FALLS A.OUT VORHANDEN
    25342542       else
    2535           [[ $localhost = lctit ]]  &&  export LM_LICENSE_FILE=27050@tggls
    25362543          [[ $localhost = lcxt4 ]]  &&  . /opt/modules/default/init/ksh
    25372544          [[ "$module_calls" != "" ]]  &&  eval $module_calls
     
    34393446          elif [[ $host = lctit ]]
    34403447          then
    3441              export runfile=runfile.$kennung
    3442 
    3443              echo "cd $PWD"                                  >   $runfile
    3444              echo "export OMP_NUM_THREADS=$OMP_NUM_THREADS"  >>  $runfile
    3445              echo "export cpurest=$cpurest"                  >>  $runfile
    3446              echo "export fname=$fname"                      >>  $runfile
    3447              echo "export localhost=$localhost"              >>  $runfile
    3448              echo "export return_addres=$return_addres"      >>  $runfile
    3449              echo "export return_username=$return_username"  >>  $runfile
    3450              echo "export tasks_per_node=$tasks_per_node"    >>  $runfile
    3451              echo "export write_binary=$write_binary"        >>  $runfile
    3452              echo "export use_seperate_pe_for_dvrp_output=$use_seperate_pe_for_dvrp_output"  >>  $runfile
    3453              echo "./a.out"                                  >>  $runfile
    3454              chmod  u+x  $runfile
    3455 
    3456              if [[ "$QUEUE" = interactive ]]
    3457              then
    3458                 mpirun  -np $numprocs  a.out  $ROPTS
    3459              else
    3460                  (( mem_tsubame = $memory / 1024.0 ))
    3461                  echo "Memory for Tsubame for each process in GB:", $mem_tsubame
    3462 #                n1ge  -fore  -g 1S060156  -mpi $numprocs  -mem 4  -N palm  -q $queue  a.out  $ROPTS
    3463 #               /n1ge/TITECH_GRID/tools/bin/n1ge -fore -g $group_number -mpi ${numprocs}:$tasks_per_node -mem $mem_tsubame -N palm -rt $minuten -q $queue  a.out  $ROPTS
    3464                  n1ge -fore -g $group_number -mpi ${numprocs}:$tasks_per_node -mem $mem_tsubame -N palm -rt $minuten -q $queue  a.out  $ROPTS
    3465              fi
    3466 
    3467              rm  $runfile
     3448             mpirun  -np $numprocs  -hostfile $PBS_NODEFILE ./a.out  $ROPTS
    34683449          else
    34693450             mpprun  -n $numprocs  a.out  $ROPTS
     
    42334214          then
    42344215
    4235              if [[ $localhost = lcsgih  ||  $localhost = lcsgib  ||  $localhost = nech  ||  $localhost = ibmh  ||  $localhost = ibmku  ||  $localhost = ibms  ||  $localhost = lctit ]]
     4216             if [[ $localhost = lcsgih  ||  $localhost = lcsgib  ||  $localhost = nech  ||  $localhost = ibmh  ||  $localhost = ibmku  ||  $localhost = ibms ]]
    42364217             then
    42374218                echo "*** ssh will be used to initiate restart-runs!"
    42384219                echo "    return_addres=\"$return_addres\" "
    42394220                echo "    return_username=\"$return_username\" "
    4240                 if [[ $return_addres = 172.20.25.41 ]]
    4241                 then
    4242                       # WORKAROUND AUF SCIROCCO AM TIT
    4243                    print  "PATH=\$PATH:$LOCAL_MRUN_PATH;export PALM_BIN=$LOCAL_MRUN_PATH;cd $LOCAL_PWD; $mc "  |  ssh $return_addres -l $return_username
    4244                 elif [[ $(echo $return_addres | grep -c "130.75.105") = 1 ]]
     4221                if [[ $(echo $return_addres | grep -c "130.75.105") = 1 ]]
    42454222                then
    42464223                   ssh $return_addres -l $return_username "PATH=\$PATH:$LOCAL_MRUN_PATH;export LD_LIBRARY_PATH=\$LD_LIBRARY_PATH:/muksoft/packages/intel/Compiler/11.0/083/lib/intel64/;export PALM_BIN=$LOCAL_MRUN_PATH;cd $LOCAL_PWD; $mc "
     
    44604437       cat   ${PALM_BIN}/$mrun_script_name          >>  $jobfile
    44614438       echo  "%END%"                                >>  $jobfile
    4462        if [[ $host = lctit ]]
    4463        then
    4464           echo "sed 's/bin\/ksh/home2\/usr5\/mkanda\/pub\/ksh/' < $mrun_script_name > mrun_new" >>  $jobfile
    4465           echo "mv  mrun_new  $mrun_script_name"    >>  $jobfile
    4466        fi
    44674439       echo  "chmod u+x $mrun_script_name"          >>  $jobfile
    44684440       echo  "execute_mrun=true"                    >>  $jobfile
Note: See TracChangeset for help on using the changeset viewer.