Workflow 4206, Stage 1
Priority | 50 |
Processors | 1 |
Wall seconds | 80000 |
RSS bytes | 2096103424 (1999 MiB) |
Max distance for inputs | 30.0 |
Enabled input RSEs |
CERN_PDUNE_EOS, DUNE_CA_SFU, DUNE_CERN_EOS, DUNE_ES_PIC, DUNE_FR_CCIN2P3_DISK, DUNE_IN_TIFR, DUNE_IT_INFN_CNAF, DUNE_UK_GLASGOW, DUNE_UK_LANCASTER_CEPH, DUNE_UK_MANCHESTER_CEPH, DUNE_US_BNL_SDCC, DUNE_US_FNAL_DISK_STAGE, FNAL_DCACHE, FNAL_DCACHE_STAGING, FNAL_DCACHE_TEST, MONTECARLO, NIKHEF, PRAGUE, QMUL, RAL-PP, RAL_ECHO, SURFSARA, T3_US_NERSC |
Enabled output RSEs |
CERN_PDUNE_EOS, DUNE_CA_SFU, DUNE_CERN_EOS, DUNE_ES_PIC, DUNE_FR_CCIN2P3_DISK, DUNE_IN_TIFR, DUNE_IT_INFN_CNAF, DUNE_UK_GLASGOW, DUNE_UK_LANCASTER_CEPH, DUNE_UK_MANCHESTER_CEPH, DUNE_US_BNL_SDCC, DUNE_US_FNAL_DISK_STAGE, FNAL_DCACHE, FNAL_DCACHE_STAGING, FNAL_DCACHE_TEST, NIKHEF, PRAGUE, QMUL, RAL-PP, RAL_ECHO, SURFSARA, T3_US_NERSC |
Enabled sites |
BR_CBPF, CA_SFU, CA_Victoria, CERN, CH_UNIBE-LHEP, CZ_FZU, ES_CIEMAT, ES_PIC, FR_CCIN2P3, IN_TIFR, IT_CNAF, NL_NIKHEF, NL_SURFsara, UK_Bristol, UK_Brunel, UK_Durham, UK_Edinburgh, UK_Imperial, UK_Lancaster, UK_Liverpool, UK_Manchester, UK_Oxford, UK_QMUL, UK_RAL-PPD, UK_RAL-Tier1, UK_Sheffield, US_BNL, US_Caltech, US_Colorado, US_FNAL-FermiGrid, US_FNAL-T1, US_Michigan, US_MIT, US_Nebraska, US_NotreDame, US_PuertoRico, US_SU-ITS, US_Swan, US_UChicago, US_UConn-HPC, US_UCSD, US_Wisconsin |
Scope | usertests |
Events for this stage |
Output patterns
| Destination | Pattern | Lifetime | For next stage |
---|
1 | https://fndcadoor.fnal.gov:2880/dune/scratch/users/calcuttj/beamevent/112024/neg1/04206/1 | *.root | | |
Environment variables
Name | Value |
---|
FCL_FILE | /cvmfs/fifeuser4.opensciencegrid.org/sw/dune/9e6c863a75128e4b76e13ec834df18e6da90d621/no_tof.fcl |
NFILES | 5 |
NTUPLE_DIR | /cvmfs/fifeuser4.opensciencegrid.org/sw/dune/0b0e77e50bec3aa86c8944031b79d1ae68ae0216 |
PRODUCT_TAR | /cvmfs/fifeuser1.opensciencegrid.org/sw/dune/8481315476ef9dce699137f4d2cd7f54ba3cfa74 |
File states
Job states
Total | Submitted | Started | Processing | Outputting | Finished | Notused | Aborted | Stalled | Jobscript error | Outputting failed | None processed |
---|
8157 | 2112 | 0 | 3866 | 0 | 1825 | 0 | 6 | 285 | 2 | 11 | 50 |
RSEs used
Name | Inputs | Outputs |
---|
DUNE_CERN_EOS | 14958 | 0 |
DUNE_ES_PIC | 9646 | 0 |
PRAGUE | 2275 | 0 |
Stats of processed input files as CSV or JSON, and of uploaded output files as CSV or JSON (up to 10000 files included)
File reset events, by site
Site | Allocated | Outputting |
---|
UK_Manchester | 320 | 10 |
UK_RAL-Tier1 | 250 | 10 |
NL_SURFsara | 205 | 0 |
UK_QMUL | 200 | 20 |
CZ_FZU | 90 | 0 |
CERN | 65 | 0 |
UK_Imperial | 60 | 10 |
UK_Lancaster | 35 | 15 |
ES_PIC | 15 | 0 |
UK_Liverpool | 10 | 0 |
UK_Brunel | 5 | 0 |
Jobscript
#!/bin/bash
#
# Jobscript preamble: validate the environment variables the rest of the
# script depends on.
#   FCL_FILE   - fcl configuration handed to `lar -c` further down
#   NTUPLE_DIR - directory that holds ntuple_prod_utils.py
# Both must be defined and non-empty; a missing one is a fatal error (exit 1).
if [ -z "${FCL_FILE}" ]; then
  echo "Fatal Must provide FCL_FILE env var"
  exit 1
fi
if [ -z "${NTUPLE_DIR}" ]; then
  echo "Fatal Must provide NTUPLE_DIR env var"
  exit 1
fi
# Check that NTUPLE_DIR is actually reachable from this worker. An
# unreachable directory ends the job with status 0 ("exiting safely") rather
# than an error -- presumably so the job is not reported as a jobscript
# failure; confirm against the workflow system's conventions.
if ! stat "${NTUPLE_DIR}"; then
  echo "Failed to stat $NTUPLE_DIR. Exiting safely"
  exit 0
fi
# Load the DUNE setup script from CVMFS, set up the metacat client and export
# the server / auth-server URLs it should talk to.
source /cvmfs/dune.opensciencegrid.org/products/dune/setup_dune.sh
setup metacat
export METACAT_SERVER_URL=https://metacat.fnal.gov:9443/dune_meta_prod/app
export METACAT_AUTH_SERVER_URL=https://metacat.fnal.gov:8143/auth/dune

# Optional: when PRODUCTS_TAR is set, verify it can be stat'ed and prepend it
# to PRODUCTS. An unreachable path ends the job with status 0.
# NOTE(review): the workflow's environment table lists PRODUCT_TAR (no "S"),
# which this check does not read -- confirm which variable name is intended.
if [[ -n "${PRODUCTS_TAR}" ]]; then
  if ! stat ${PRODUCTS_TAR}; then
    echo "Failed to stat $PRODUCTS_TAR. Exiting safely"
    exit 0
  fi
  export PRODUCTS="${PRODUCTS_TAR}:${PRODUCTS}"
  echo "Set protoduneana to $PRODUCTS_TAR"
fi
# Set up a recent lar software suite (dunesw).
# DUNE_VERSION and DUNE_QUALIFIER may be supplied by the environment;
# otherwise the defaults below are used.
DUNE_VERSION=${DUNE_VERSION:-v10_01_01d00}
dune_qualifier=${DUNE_QUALIFIER:-e26:prof}
setup dunesw \
  "${DUNE_VERSION}" \
  -q "${dune_qualifier}"
# Capture the status right away and test the captured value: $? is
# overwritten by every command, including the assignment itself, so testing
# $? after the assignment would always see 0.
setup_exit=$?
if [ "${setup_exit}" -ne 0 ]; then
  # Report the qualifier that was actually requested (default included).
  echo "Failed to setup dunesw $DUNE_VERSION $dune_qualifier"
  exit "${setup_exit}"
fi
# Log which dunesw product ended up active.
echo "DUNESW loc:"
ups active | grep dunesw
# Fall back to a single processor when JUSTIN_PROCESSORS is unset or empty.
JUSTIN_PROCESSORS=${JUSTIN_PROCESSORS:-1}
echo "Justin processors: ${JUSTIN_PROCESSORS}"

# Export the same value through each of the thread-count variables below.
for thread_var in \
  TF_NUM_THREADS \
  OPENBLAS_NUM_THREADS \
  JULIA_NUM_THREADS \
  MKL_NUM_THREADS \
  NUMEXPR_NUM_THREADS \
  OMP_NUM_THREADS; do
  export "${thread_var}=${JUSTIN_PROCESSORS}"
done

# Dump the full environment, then only the JUSTIN-related entries, to the
# job log.
echo "printing env"
env
echo "Justin specific env vars"
env | grep JUSTIN
echo "Will use justin-get-file"
#
# Ask the helper in NTUPLE_DIR for up to NFILES input files (default 1).
# It is told to write the DIDs to input_dids.list and the PFNs to
# input_pfns.list.
nfiles=${NFILES:-1}
python "${NTUPLE_DIR}/ntuple_prod_utils.py" get_nfiles_justin \
  -n "${nfiles}" \
  --dids input_dids.list \
  --pfns input_pfns.list
# The helper's exit status is deliberately not checked (the check below was
# already disabled); the PFN count is what decides whether to continue.
#pfn_exit=$?
#if [ $pfn_exit -ne 0 ]; then
# echo "Error in get_nfiles_justin. Exiting"
# exit $pfn_exit
#fi

# Count the PFNs. A list file that was never created counts as zero files,
# so the job takes the "exit safely" path below instead of hitting a broken
# numeric test and running lar with no inputs.
n_files_retrieved=0
if [ -f input_pfns.list ]; then
  n_files_retrieved=$(wc -l < input_pfns.list)
fi
echo "Files retrieved: ${n_files_retrieved}"
if [ "${n_files_retrieved}" -eq 0 ]; then
  echo "No files retrieved. Exiting safely"
  exit 0
fi
pfn_list=$(cat input_pfns.list)
echo "PFN list:"
# Intentionally unquoted: prints the whole list on a single log line.
echo $pfn_list
# Build the output file name from PREFIX, the job id, stage id, workflow id
# and a UTC timestamp.
now=$(date -u +"%Y%m%dT%H%M%SZ")
# TODO -- edit this
# Earlier variant kept only the text before the first '.':
#jobid=`echo "${JUSTIN_JOBSUB_ID:-1}" | awk -F '.' '{print $1}'`
# Current variant: keep the text before the first '@' and turn the first '.'
# into '_'.
jobid=${JUSTIN_JOBSUB_ID:-1}
jobid=${jobid%%@*}
jobid=${jobid/./_}
PREFIX=${PREFIX:-"beamana"}
OUTFILE="${PREFIX}_${jobid}_${JUSTIN_STAGE_ID}_${JUSTIN_WORKFLOW_ID}_${now}.root"
# NEVENTS defaults to -1.
nevents=${NEVENTS:--1}

echo "Running pdspana"
touch ana.log
starttime=$(date +"%s").0
# Run lar with the XRootD POSIX preload library, sending stdout and stderr to
# ana.log. pfn_list is left unquoted on purpose so that every PFN becomes its
# own argument after -s.
LD_PRELOAD=$XROOTD_LIB/libXrdPosixPreload.so lar \
  -c ${FCL_FILE} \
  -n ${nevents} \
  -T ${OUTFILE} \
  -s ${pfn_list} > ana.log 2>&1
larExit=$?
endtime=$(date +"%s").0

# On failure, dump the lar log into the job output and propagate lar's status.
if (( larExit != 0 )); then
  echo "Error in ntuple production"
  cat ana.log
  exit $larExit
fi

echo "Ran successfully"
echo "formed"
# Record the PFNs that were processed, one per line.
echo "$pfn_list" > justin-processed-pfns.txt