Changeset 1620 for palm/trunk/SCRIPTS/mrun
- Timestamp: Jul 17, 2015 11:37:41 AM (10 years ago)
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
palm/trunk/SCRIPTS/mrun
r1610 r1620 22 22 # Current revisions: 23 23 # ------------------ 24 # 24 # adjustments for Mistral at DKRZ Hamburg (lcbullhh) 25 25 # 26 26 # Former revisions: … … 324 324 typeset -i cputime i ii iia iii iio icycle inode ival jobges jobsek last_char_int maxcycle minuten nodes pes remaining_pes sekunden tp1 325 325 326 327 328 326 # ERROR HANDLING IN CASE OF EXIT 329 327 trap 'rm -rf $working_directory/tmp_mrun … … 610 608 do_remote=true 611 609 case $host in 612 (ibm|ibmh|ibmkisti|ibmku|ibms|nech|lc crayb|lccrayh|lccrayf|lcflow|lckyoto|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;;610 (ibm|ibmh|ibmkisti|ibmku|ibms|nech|lcbullhh|lccrayb|lccrayh|lccrayf|lcflow|lckyoto|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;; 613 611 (*) printf "\n" 614 612 printf "\n +++ sorry: execution of batch jobs on remote host \"$host\"" … … 669 667 fi 670 668 671 672 669 # CHECK, IF FILE-ARCHIVING HAS FAILED IN PREVIOUS JOB (OF A JOB-CHAIN) 673 670 if [[ -f ~/job_queue/ARCHIVE_ERROR_$fname ]] … … 697 694 if [[ "$read_from_config" = false ]] 698 695 then 699 700 696 [[ $silent = false ]] && printf "\n Reading the configuration file... " 701 697 … … 769 765 do_remote=true 770 766 case $host in 771 (ibm|ibmh|ibmkisti|ibmku|ibms|lc crayb|lccrayh|lccrayf|lcflow|lckyoto|nech|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;;767 (ibm|ibmh|ibmkisti|ibmku|ibms|lcbullhh|lccrayb|lccrayh|lccrayf|lcflow|lckyoto|nech|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;; 772 768 (*) printf "\n +++ sorry: execution of batch jobs on remote host \"$host\"" 773 769 printf "\n is not available" … … 887 883 else 888 884 889 890 885 # EVALUATE THE CONFIGURATION-FILE BY FORTRAN-PROGRAM 891 886 [[ $silent = false ]] && printf "..." 
… … 1034 1029 do_remote=true 1035 1030 case $host in 1036 (ibm|ibmh|ibmkisti|ibmku|ibms|lc crayb|lccrayh|lccrayf|lcflow|lckyoto|nech|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;;1031 (ibm|ibmh|ibmkisti|ibmku|ibms|lcbullhh|lccrayb|lccrayh|lccrayf|lcflow|lckyoto|nech|unics|lcxe6|lcxt5m|lck|lckiaps|lckordi|lckyuh|lckyut|lcsb) true;; 1037 1032 (*) printf "\n" 1038 1033 printf "\n +++ sorry: execution of batch jobs on remote host \"$host\"" … … 1045 1040 1046 1041 1042 1047 1043 # IN CASE OF PARALLEL EXECUTION, CHECK SOME SPECIFICATIONS CONCERNING PROCESSOR NUMBERS 1048 1044 if [[ "$cond1" = parallel || "$cond2" = parallel ]] … … 1160 1156 (ibmh) queue=cluster;; 1161 1157 (ibmkisti) queue=class.32plus;; 1158 (lcbullhh) queue=compute;; 1162 1159 (lccrayb) queue=mpp1q;; 1163 1160 (lccrayh) queue=mpp1q;; … … 2170 2167 fi 2171 2168 2172 2173 2169 # QUERY FOR CONTINUE (ON LOCAL MACHINES ONLY) 2174 2170 if [[ $remotecall = false && $silent = false && $jobmo != BATCH ]] … … 2634 2630 rm -rf $check_sources 2635 2631 cd $working_directory 2636 2637 2632 2638 2633 # DETERMINE PATH FOR MAKE DEPOSITORY … … 2825 2820 [[ "$check_for_file" = "" ]] && compile_error=true 2826 2821 continue # STATUS=1, IF a.out EXISTS 2827 elif [[ $localhost = lc crayb || $localhost = lccrayf || $localhost = lccrayh ]]2822 elif [[ $localhost = lcbullhh || $localhost = lccrayb || $localhost = lccrayf || $localhost = lccrayh ]] 2828 2823 then 2829 2824 make $mopts -f Makefile PROG=a.out F90=$compiler_name COPT="$cpp_options" F90FLAGS="$fopts" LDFLAGS="$lopts" … … 3497 3492 # COPY HOSTFILE FROM SOURCE DIRECTORY OR CREATE IT, IF IT 3498 3493 # DOES NOT EXIST 3499 if [[ $host != lccrayb && $host != lccrayf && $host != lccrayh && $host != lckyuh && $host != lckyut ]]3494 if [[ $host != lccrayb && $host != lccrayf && $host != lccrayh && $host != lckyuh && $host != lckyut ]] 3500 3495 then 3501 3496 if [[ -f $hostfile ]] … … 3666 3661 echo "mpirun -np $ii -hostfile $PBS_NODEFILE ./a.out 
$ROPTS" 3667 3662 mpirun -np $ii -hostfile $PBS_NODEFILE ./a.out $ROPTS 3663 3664 elif [[ $host = lcbullhh ]] 3665 then 3666 export OMPI_MCA_pml=cm 3667 export OMPI_MCA_mtl=mxm 3668 export OMPI_MCA_coll=^ghc 3669 export OMPI_MCA_mtl_mxm_np=0 3670 export MXM_RDMA_PORTS=mlx5_0:1 3671 export MXM_LOG_LEVEL=ERROR 3672 export OMP_NUM_THREADS=$threads_per_task 3673 export KMP_AFFINITY=verbose,granularity=core,compact,1 3674 export KMP_STACKSIZE=64m 3675 3676 srun --nodes=$nodes --ntasks-per-node=$tasks_per_node ./a.out 3668 3677 else 3669 3678 mpprun -n $numprocs a.out $ROPTS 3670 3679 fi 3671 3680 else 3672 3681 a.out $ROPTS 3673 3682 fi … … 3892 3901 then 3893 3902 ssh $usern@hlogin1 ". \\$HOME/.profile; cd $TEMPDIR; batch_scp $PORTOPT $cps -b -m -u $return_username $return_address ${localout[$i]} \"${pathout[$i]}\" ${localhost}_${fname}${endout[$i]} ${extout[$i]}" 3903 elif [[ $localhost = lcbullhh ]] 3904 then 3905 ssh $usern@mlogin101 ". \\$HOME/.profile; cd $TEMPDIR; batch_scp $PORTOPT $cps -b -m -u $return_username $return_address ${localout[$i]} \"${pathout[$i]}\" ${localhost}_${fname}${endout[$i]} ${extout[$i]}" 3894 3906 elif [[ $localhost = lcxe6 ]] 3895 3907 then … … 4454 4466 then 4455 4467 4456 if [[ $localhost = lc crayb || $localhost = lccrayh || $localhost = nech || $localhost = ibmh || $localhost = ibmkisti || $localhost = ibmku || $localhost = ibms || $localhost = lcflow || $localhost = lckyu* ||$localhost = lcxe6 ]]4468 if [[ $localhost = lcbullhh || $localhost = lccrayb || $localhost = lccrayh || $localhost = nech || $localhost = ibmh || $localhost = ibmkisti || $localhost = ibmku || $localhost = ibms || $localhost = lcflow || $localhost = lckyu* || $localhost = lcxe6 ]] 4457 4469 then 4458 4470 echo "*** ssh will be used to initiate restart-runs!" … … 4464 4476 then 4465 4477 ssh $SSH_PORTOPT $usern@136.172.40.15 "ssh $SSH_PORTOPT $return_address -l $return_username \". 
\\\$HOME/.profile; module load intel-compiler hdf5 netcdf; PATH=\\\$PATH:$LOCAL_MRUN_PATH;export PALM_BIN=$LOCAL_MRUN_PATH;cd $LOCAL_PWD; $mc\" " 4478 elif [[ $localhost = lcbullhh ]] 4479 then 4480 ssh $SSH_PORTOPT $usern@mlogin101 "ssh $SSH_PORTOPT $return_address -l $return_username \". \\\$HOME/.profile; module load intel-compiler hdf5 netcdf; PATH=\\\$PATH:$LOCAL_MRUN_PATH;export PALM_BIN=$LOCAL_MRUN_PATH;cd $LOCAL_PWD; $mc\" " 4466 4481 elif [[ $localhost = lccrayb ]] 4467 4482 then … … 4582 4597 else 4583 4598 4584 4585 4599 # PREPARING ACTIONS, 4586 4600 # IF A BATCH-JOB IS TO BE GENERATED AND STARTED ON A REMOTE-MACHINE GERECHNET … … 4696 4710 # THIS MAY CREATE A QUITE LARGE JOB-FILE, WHICH CAN CAUSE PROBLEMS WITH SOME 4697 4711 # QUEUEING-SYSTEMS 4698 if [[ $host = ibmkisti || $host = lc crayb || $host = lccrayf || $host = lccrayh ]]4712 if [[ $host = ibmkisti || $host = lcbullhh || $host = lccrayb || $host = lccrayf || $host = lccrayh ]] 4699 4713 then 4700 4714 … … 4711 4725 if [[ $host = $localhost ]] 4712 4726 then 4713 4714 4727 # DUE TO UNKNOWN REASONS, COPY WITH cp COMMAND CREATES CORRUPT 4715 4728 # FILES ON CRAY XC30 SYSTEMS (CSC HELSINKI), rsync IS USED INSTEAD … … 4727 4740 echo "localdir=\`pwd\`" >> $jobfile 4728 4741 echo "ssh $SSH_PORTOPT $remote_username@gaiad \"cd \$localdir; scp $PORTOPT -r $return_username@$return_address:$working_directory/SOURCES_FOR_RUN_$fname .\" " >> $jobfile 4742 elif [[ $host = lcbullhh ]] 4743 then 4744 echo "localdir=\`pwd\`" >> $jobfile 4745 echo "ssh $SSH_PORTOPT $remote_username@mlogin101 \"cd \$localdir; scp $PORTOPT -r $return_username@$return_address:$working_directory/SOURCES_FOR_RUN_$fname .\" " >> $jobfile 4746 4729 4747 elif [[ $host = lccrayb ]] 4730 4748 then
Note: See TracChangeset for help on using the changeset viewer.