Skip to content
Snippets Groups Projects

First patch for silent ATLAS SIM failures (BMK-129)

Merged Andrea Valassi requested to merge valassi/hep-workloads:BMK-129 into qa
2 files
+ 46
44
Compare changes
  • Side-by-side
  • Inline
Files
2
@@ -4,33 +4,35 @@ echo "[$0] `date` starting"
status=0
#######################################
# Run one copy of the ATLAS simulation (Sim_tf.py) in its own work directory.
# Globals:
#   BASE_WDIR (read)  - parent directory holding the per-copy work directories
#   DEBUG     (read)  - values > 0 enable progress messages (unset counts as 0)
#   nevents   (read)  - passed to Sim_tf.py as --maxEvents
#   WDIR, inputdatadir, inputdata (written) - kept global, as in the original
#   status    (written) - set to 1 on failure (BMK-129)
# Arguments:
#   $1 - identifier of this copy; names the work directory and the log file
# Outputs:
#   Progress/failure messages on stdout; stdout AND stderr of Sim_tf.py are
#   written to $WDIR/out_$1.log.
# Returns:
#   0 if Sim_tf.py succeeded, 1 otherwise (including work-directory errors).
#######################################
function doOne(){
  if [ "${DEBUG:-0}" -gt 0 ]; then
    echo "$(date) : start process $1"
  fi

  WDIR=$BASE_WDIR/proc_$1
  if [ "${DEBUG:-0}" -gt 0 ]; then
    echo "$WDIR"
  fi

  # Start from a clean work directory: remove leftovers of a previous run.
  # (The original ran 'rm -f $DIR' on an undefined variable, i.e. a no-op.)
  if [ -e "$WDIR" ]; then
    rm -rf -- "$WDIR"
  fi
  if ! mkdir -p "$WDIR" || ! cd "$WDIR"; then
    echo "Cannot prepare working directory $WDIR"
    status=1
    return 1
  fi

  # input file to be moved on /cvmfs/
  inputdatadir=/cvmfs/atlas.cern.ch/repo/benchmarks/hep-workloads/input-data
  inputdata=$inputdatadir/EVNT.13043099._000859.pool.root.1

  # Redirect stdout to the log first and only then duplicate stderr onto it;
  # with the reverse order ('2>&1 > file') stderr never reaches the log.
  if ! Sim_tf.py --inputEVNTFile="$inputdata" --maxEvents="$nevents" \
    --postInclude "default:RecJobTransforms/UseFrontier.py" \
    --preExec "EVNTtoHITS:simFlags.SimBarcodeOffset.set_Value_and_Lock(200000)" "EVNTtoHITS:simFlags.TRTRangeCut=30.0;simFlags.TightMuonStepping=True" \
    --preInclude "EVNTtoHITS:SimulationJobOptions/preInclude.BeamPipeKill.py,SimulationJobOptions/preInclude.FrozenShowersFCalOnly.py" \
    --skipEvents="0" --firstEvent="6160001" \
    --outputHITSFile='myHITS.pool.root' \
    --physicsList="FTFP_BERT_ATL_VALIDATION" \
    --randomSeed="6163" --DBRelease="100.0.2" --conditionsTag "default:OFLCOND-MC16-SDR-14" \
    --geometryVersion="default:ATLAS-R2-2016-01-00-01_VALIDATION" --runNumber="407343" --AMITag="s3126" --DataRunNumber="284500" \
    --simulator="FullG4" --truthStrategy="MC15aPlus" > "out_$1.log" 2>&1; then
    echo "Sim_tf.py failed"
    status=1
    echo -e "\n$(date) : Process $1 failed\n"
    return 1 # BMK-129: report the failure to the caller instead of hiding it
  fi

  if [ "${DEBUG:-0}" -gt 0 ]; then
    echo -e "\n$(date) : Process $1 successfully completed\n"
  fi
  return 0
}
export APP=`basename $0 -bmk.sh`
@@ -45,8 +47,8 @@ export ncopies=$((`nproc`/$NTHREADS))
#when $NTHREADS > nproc
if [ "$ncopies" -lt 1 ]; then
ncopies=1
NTHREADS=$((`nproc`/$ncopies))
ncopies=1
NTHREADS=$((`nproc`/$ncopies))
fi
@@ -59,17 +61,17 @@ user_ncopies=""
# Holds the value of the -t option. The name must match the one assigned in
# the getopts loop and tested afterwards (user_nthreads); initialising it here
# keeps a value inherited from the environment from being used by mistake.
user_nthreads=""
while getopts "w:n:e:t:dh" o; do
case ${o} in
w)
w)
RESULTS_DIR=$OPTARG
;;
n)
[ $OPTARG -gt 0 ] && user_ncopies=$OPTARG
;;
e)
[ $OPTARG -gt 0 ] && nevents_thread=$OPTARG
e)
[ $OPTARG -gt 0 ] && nevents_thread=$OPTARG
;;
t)
[ $OPTARG -gt 0 ] && user_nthreads=$OPTARG
[ $OPTARG -gt 0 ] && user_nthreads=$OPTARG
;;
d)
DEBUG=1
@@ -83,14 +85,14 @@ done
if [ "$user_nthreads" != "" ] && [ "$user_ncopies" != "" ]; then
ncopies=$user_ncopies
NTHREADS=$user_nthreads
ncopies=$user_ncopies
NTHREADS=$user_nthreads
elif [ "$user_nthreads" != "" ]; then
NTHREADS=$user_nthreads
ncopies=$((`nproc`/$NTHREADS))
NTHREADS=$user_nthreads
ncopies=$((`nproc`/$NTHREADS))
elif [ "$user_ncopies" != "" ]; then
ncopies=$user_ncopies
NTHREADS=$((`nproc`/$ncopies))
ncopies=$user_ncopies
NTHREADS=$((`nproc`/$ncopies))
fi
export s_msg="ok"
@@ -100,7 +102,7 @@ tot_load=$(($ncopies*$NTHREADS))
[ $tot_load -gt `nproc` ] && s_msg="[ERROR] ncopies*NTHREADS=$ncopies*$NTHREADS=$tot_load > number of available cores (`nproc`)" && generateSummary && exit 1
[ $tot_load -eq 0 ] && s_msg="[ERROR] ncopies*NTHREADS=$ncopies*$NTHREADS=$tot_load. Please fix it" && generateSummary && exit 1
[ $tot_load -ne `nproc` ] && s_msg="[WARNING] ncopies*NTHREADS ($ncopies*$NTHREADS=$tot_load) != `nproc` (number of available cores)" && echo $s_msg
[ $tot_load -ne `nproc` ] && s_msg="[WARNING] ncopies*NTHREADS ($ncopies*$NTHREADS=$tot_load) != `nproc` (number of available cores)" && echo $s_msg
export ATHENA_PROC_NUMBER=$NTHREADS #enc variable for ATHENA threads number
@@ -117,7 +119,7 @@ release=21.0.15
export ATLAS_LOCAL_ROOT_BASE=/cvmfs/atlas.cern.ch/repo/ATLASLocalRootBase
source ${ATLAS_LOCAL_ROOT_BASE}/user/atlasLocalSetup.sh -q
asetup --cmtconfig=x86_64-slc6-gcc49-opt AtlasOffline,${release}
unset FRONTIER_SERVER
unset FRONTIER_SERVER
for i in `seq 1 $ncopies`;
Loading