#!/bin/bash # Submission script for GridEngine (GE). Each job will # be executed via the jobScript.sh # This jobScript supports up to 7 parameters. Edit # the user specific part of the script according to # your program. # # Input to the script is a filelist with 1 file per line. # For each file a job is started. With the parameter # nFilesPerJob a comma separated filelist will be # generated and handed to the job script. This feature # is usefull when running many small jobs. Each # job has its own logfile. All needed directories for the # logfiles will be created if non existing. # # IMPORTANT: the hera/prometheus cluster jobs will only # see the /hera file system. All needed scripts, programs # and parameters have to be located on /hera or the job # will crash. This script syncs your working dir to the submission # dir on /hera . Make sure your scripts use the submission dir! # Software should be taken from /cvmfs/hades.gsi.de/install/ # # job log files will be named like inputfiles. If nFilesPerJob > 1 # the log files will contain the partnumber. # ###################################################################### # CONFIGURATION user=$(whoami) currentDir=$(pwd | xargs -i basename {}) currentDir=../$currentDir day=095 submmissionbase=/hera/hades/user/${user}/sub/apr12/test submissiondir=${submmissionbase}/loopDST nFilesPerJob=10 # number of files to be analyzed by 1 job (default==1) jobscript=${submissiondir}/jobScript.sh # exec script (full path, call without dot, set it executable!) outputdir=/hera/hades/user/${user}/apr12/loop # outputdir for files AND logFiles pathoutputlog=${outputdir}/out # protocol from batch farm for each file filename=apr12ana_${day} # filename of log file if nFilesPerJob > 1 (partnumber will be appended) par1=/cvmfs/hades.gsi.de/install/5.34.01/hydra2-3.8/defall.sh # optional par1 : environment script par2=${submissiondir}/analysis # optional par2 : executable par3="" # optional par3 : input file list par4=${outputdir} # optional par4 : outputfile (part number will be appended (_num.root)) par5=-1 # optional par5 : number of events par6="no" # optional par6 par7="no" # optional par7 "single" to run comma separated list as single files in jobscript resources="-l h_rt=4:0:0,h_vmem=2G" # runtime < 10h, mem < 2GB jobarrayFile="loop_day_${day}_jobarray.dat" filelist=${currentDir}/lists/day_${day}.list # file list in local dir! not in submissiondir!!! ###################################################################### nFiles=$( cat $filelist | wc -l) #--------------------------------------------------------------------- # create needed dirs if [ ! -d $submmissionbase ] then echo "===> CREATE SUBMISSIONBASEDIR : $submmissionbase" mkdir -p $submmissionbase else echo "===> USE SUBMISSIONBASEDIR : $submmissionbase" fi #--------------------------------------------------------------------- # output dirs if [ ! -d $pathoutputlog ] then echo "===> CREATE LOGDIR : $pathoutputlog" mkdir -p $pathoutputlog else echo "===> USE LOGDIR : $pathoutputlog" fi if [ ! -d $outputdir ] then echo "===> CREATE OUTPUTDIR : $outputdir" mkdir -p $outputdir else echo "===> USE OUTPUTDIR : $outputdir" fi if [ ! -d $outputdir/crash ] then echo "===> CREATE CRASHDIR : $outputdir/crash" mkdir -p $outputdir/crash fi #--------------------------------------------------------------------- ctF=0 # counter for file number ctJ=0 # counter for job number partNumber=0 # counter for part number if [ -f $jobarrayFile ] then rm -f $jobarrayFile fi echo "===> CREATING JOB ARRAY FILE" #--------------------------------------------------------------------- # read the files list into an job array declare -a jobarray ct1=0 for file in $(cat $filelist) do jobarray[$ct1]=$file ((ct1+=1)) done #--------------------------------------------------------------------- #--------------------------------------------------------------------- # loop over the job array and submit parts with # nFilesPerJob to GE while ((ctF<$nFiles)) do #--------------------------------------------------------------------- # build comma separated file list # per job if [ $nFilesPerJob -gt 1 ] then infileList=${jobarray[${ctF}]} ((ctF+=1)) for (( ctList=1;ctList<$nFilesPerJob; ctList++ )) do if [ $ctF -lt ${nFiles} ] then infileList="${infileList},${jobarray[${ctF}]}" ((ctF+=1)) fi done else infileList=${jobarray[${ctF}]} ((ctF+=1)) fi #--------------------------------------------------------------------- ((partNumber+=1)) logfile="${pathoutputlog}/${filename}_${partNumber}.log" if [ $nFilesPerJob -eq 1 ] then file=$(basename ${infileList}) logfile="${pathoutputlog}/${file}.log" par4=${outputdir}/${filename}_${file}.root else par4=${outputdir}/${filename}_${partNumber}.root fi if [ -f ${logfile} ] then rm -f ${logfile} fi ###################################################################### # SEND NEW JOB (USER SPECIFIC) par3=${infileList} command="-j y -wd ${submissiondir} ${resources} -o ${logfile} \ ${jobscript} ${par1} ${par2} ${par3} ${par4} ${par5} ${par6} ${par7}" #jobscript.sh defall.sh prog filelist outfile nev echo "${par1} ${par2} ${par3} ${par4} ${par5} ${par6} ${par7}" >> $jobarrayFile ###################################################################### done #--------------------------------------------------------------------- #--------------------------------------------------------------------- # sync the local modified stuff # to the submission dir echo "===> SYNC CURENTDIR TO SUBMISSIONDIR : rsync -vHaz $currentDir ${submmissionbase}" rsync -vHaz $currentDir ${submmissionbase}/ syncStat=$? if [ ! $syncStat -eq 0 ] then echo "===> ERROR : SYNCHRONIZATION ENCOUNTERED PROBLEMS" else echo "-------------------------------------------------" nFiles=$( cat $jobarrayFile | wc -l) ctsend=0 block=2000 while ((${ctsend} * ${block} < ${nFiles})) do ((start=${ctsend}*${block}+1)) ((stop= ${start}+${block}-1)) ((rest=${nFiles}-${start})) if [ $rest -le $block ] then ((stop=$start+$rest)) fi qsub -t ${start}-${stop} -j y -wd ${submissiondir} ${resources} -o ${pathoutputlog} ${jobscript} ${submissiondir}/${jobarrayFile} ${pathoutputlog} ((ctsend+=1)) done echo "${nFiles} jobs for day ${day} submitted" fi