justIN           Dashboard       Workflows       Jobs       AWT       Sites       Storages       Docs       Login

Workflow 12502, Stage 1

Workflow12502
Campaign849
Priority50
Processors1
Wall seconds80000
Image/cvmfs/singularity.opensciencegrid.org/fermilab/fnal-wn-sl7:latest
RSS bytes5241831424 (4999 MiB)
Max distance for inputs100.0
Enabled input RSEs CERN_PDUNE_EOS, DUNE_CA_SFU, DUNE_CERN_EOS, DUNE_ES_PIC, DUNE_FR_CCIN2P3_DISK, DUNE_IN_TIFR, DUNE_IT_INFN_CNAF, DUNE_UK_GLASGOW, DUNE_UK_LANCASTER_CEPH, DUNE_UK_MANCHESTER_CEPH, DUNE_US_BNL_SDCC, DUNE_US_FNAL_DISK_STAGE, FNAL_DCACHE, FNAL_DCACHE_STAGING, FNAL_DCACHE_TEST, MONTECARLO, NIKHEF, PRAGUE, QMUL, RAL-PP, RAL_ECHO, SURFSARA, T3_US_NERSC
Enabled output RSEs CERN_PDUNE_EOS, DUNE_CA_SFU, DUNE_CERN_EOS, DUNE_ES_PIC, DUNE_FR_CCIN2P3_DISK, DUNE_IN_TIFR, DUNE_IT_INFN_CNAF, DUNE_UK_GLASGOW, DUNE_UK_LANCASTER_CEPH, DUNE_UK_MANCHESTER_CEPH, DUNE_US_BNL_SDCC, DUNE_US_FNAL_DISK_STAGE, FNAL_DCACHE, FNAL_DCACHE_STAGING, FNAL_DCACHE_TEST, NIKHEF, PRAGUE, QMUL, RAL-PP, RAL_ECHO, SURFSARA, T3_US_NERSC
Enabled sites BR_CBPF, CA_SFU, CA_Victoria, CERN, CH_UNIBE-LHEP, CZ_FZU, ES_CIEMAT, ES_PIC, FR_CCIN2P3, IT_CNAF, NL_NIKHEF, NL_SURFsara, UK_Bristol, UK_Brunel, UK_Durham, UK_Edinburgh, UK_Glasgow, UK_Imperial, UK_Lancaster, UK_Liverpool, UK_Manchester, UK_Oxford, UK_QMUL, UK_RAL-PPD, UK_RAL-Tier1, UK_Sheffield, US_BNL, US_Colorado, US_FNAL-FermiGrid, US_FNAL-T1, US_Michigan, US_NotreDame, US_PuertoRico, US_SU-ITS, US_Swan, US_UChicago, US_UConn-HPC, US_UCSD, US_Wisconsin
Scopeusertests
Events for this stage

Output patterns

 DestinationPatternLifetimeFor next stageRSE expression
1https://fndcadoor.fnal.gov:2880/dune/scratch/users/jjo/fnal/12502/1out_*.tgz

Environment variables

NameValue
INPUT_TAR_DIR_LOCAL/cvmfs/fifeuser4.opensciencegrid.org/sw/dune/052d43a26e9fd1b52dc226f18c4daf77c376f535
NUM_EVENTS10

File states

Total filesFindingUnallocatedAllocatedOutputtingProcessedNot foundFailed
100000010000

Job states

TotalSubmittedStartedProcessingOutputtingFinishedNotusedAbortedStalledJobscript errorOutputting failedNone processed
17800001600016200
Files processed00101020203030404050506060707080809090Jan-28 21:00Jan-28 22:00Jan-28 23:00Jan-29 00:00Jan-29 01:00Files processedBin start timesNumber per binNL_SURFsaraUK_QMULUK_SheffieldUK_ManchesterUK_RAL-Tier1NL_NIKHEFUK_BrunelUK_RAL-PPDUS_UChicagoCZ_FZUUS_FNAL-FermiG…US_FNAL-FermiGridCERNES_PIC

RSEs used

NameInputsOutputs
MONTECARLO1180
None0100

Stats of processed input files as CSV or JSON, and of uploaded output files as CSV or JSON (up to 10000 files included)

File reset events, by site

SiteAllocatedOutputting
CA_SFU80
UK_QMUL20
UK_Manchester20
US_UChicago20
NL_SURFsara10
UK_RAL-Tier110

Jobscript

#!/bin/bash
#
# fdhd_test.jobscript
# Minimal test jobscript that runs a short FD-HD chain.
#

# ---- Environment setup ----
# Load the DUNE setup script from CVMFS; it is expected to provide the
# `setup` command used just below.
source /cvmfs/dune.opensciencegrid.org/products/dune/setup_dune.sh

# Activate the requested dunesw version and qualifier. Any non-zero status
# (including `setup` not being defined) aborts the job.
if ! setup dunesw v10_16_00d00 -q e26:prof; then
  echo "Error setting up dunesw v10_16_00d00"
  exit 1
fi

# Prefer uploaded FHiCLs and WireCell configs if provided

#######################################
# Put a directory at the front of a colon-separated search-path variable and
# export the result. The ':' separator is only added when the variable
# already holds a value, so an unset/empty variable does not end up with a
# trailing ':' (an empty path element).
# Arguments:
#   $1 - name of the variable to update
#   $2 - directory to place first
#######################################
prepend_search_path() {
  local var_name=$1
  local new_dir=$2
  local current=${!var_name:-}
  export "${var_name}=${new_dir}${current:+:${current}}"
}

if [ -n "${INPUT_TAR_DIR_LOCAL:-}" ]; then
    # Directory inside the uploaded area that holds the configuration files
    config_dir="${INPUT_TAR_DIR_LOCAL}/cffm-if/dune10kt-1x2x6"

    # Tell art/lar where to find .fcl files
    prepend_search_path FW_SEARCH_PATH "${config_dir}"
    prepend_search_path FCL_SEARCH_PATH "${config_dir}"
    prepend_search_path FHICL_FILE_PATH "${config_dir}"

    # WireCell lookup
    prepend_search_path WIRECELL_PATH "${config_dir}"
fi

# Log the effective search paths for debugging
echo "FW_SEARCH_PATH=${FW_SEARCH_PATH}"
echo "FCL_SEARCH_PATH=${FCL_SEARCH_PATH}"
echo "FHICL_FILE_PATH=${FHICL_FILE_PATH}"
echo "WIRECELL_PATH=${WIRECELL_PATH}"

# Parallelism
# Fall back to a single processor when JUSTIN_PROCESSORS is unset or empty,
# then pass the same count to every thread-count variable exported below.
: "${JUSTIN_PROCESSORS:=1}"
export \
  TF_NUM_THREADS="${JUSTIN_PROCESSORS}" \
  OPENBLAS_NUM_THREADS="${JUSTIN_PROCESSORS}" \
  JULIA_NUM_THREADS="${JUSTIN_PROCESSORS}" \
  MKL_NUM_THREADS="${JUSTIN_PROCESSORS}" \
  NUMEXPR_NUM_THREADS="${JUSTIN_PROCESSORS}" \
  OMP_NUM_THREADS="${JUSTIN_PROCESSORS}"

# ---- Get one input file (MC counter or real file, depending on submission) ----
# The command path is quoted so a JUSTIN_PATH containing spaces or glob
# characters cannot be split or expanded.
did_pfn_rse="$("${JUSTIN_PATH}/justin-get-file")"
if [ -z "${did_pfn_rse}" ] ; then
  # Empty output is treated as "nothing left to do", not as an error.
  echo "No unprocessed files available, exiting."
  exit 0
fi

# The reply is split on single spaces: field 1 = DID, field 2 = PFN,
# field 3 = RSE. printf is used instead of echo so the value is never
# interpreted as an echo option.
did=$(printf '%s\n' "${did_pfn_rse}" | cut -f1 -d' ')
pfn=$(printf '%s\n' "${did_pfn_rse}" | cut -f2 -d' ')
rse=$(printf '%s\n' "${did_pfn_rse}" | cut -f3 -d' ')
# Second ':'-separated field of the DID (the whole DID if it has no ':')
name_only=$(printf '%s\n' "${did}" | cut -f2 -d':')

echo "Processing file: ${pfn}"
echo "RSE: ${rse}"
echo "DID: ${did}"

# ---- Number of events to generate (NUM_EVENTS, defaulting to 10) ----
nevents=${NUM_EVENTS:-10}

# ---- Pieces used to build unique output names ----
# UTC timestamp, e.g. 20260128T210000Z
now="$(date -u '+%Y%m%dT%H%M%SZ')"
# Job id: the part of JUSTIN_JOBSUB_ID before the first '@' (default "1"),
# with its first '.' turned into '_'.
jobid=${JUSTIN_JOBSUB_ID:-1}
jobid=${jobid%%@*}
jobid=${jobid/./_}
# Stage id, defaulting to 1 when JUSTIN_STAGE_ID is unset or empty
stageid="${JUSTIN_STAGE_ID:-1}"

# ---- LArSoft chain ----
# Each stage logs the working directory, runs `lar`, and aborts the job with
# exit status 1 as soon as a stage returns non-zero.

# 1. GEN (pure MC): generate ${nevents} events into gen.root
echo "Running: GEN stage ..."
ls -lh
lar -n "${nevents}" -c gen_genie.fcl -o gen.root || { echo "GEN failed"; exit 1; }

# 2. G4: gen.root -> g4.root
echo "Running: G4 stage ..."
ls -lh
lar -c g4.fcl -s gen.root -o g4.root || { echo "G4 failed"; exit 1; }

# 3. WireCell Sim SP: g4.root -> sp.root
echo "Running: WC SIM SP stage ..."
ls -lh
# Unique tag for this job's outputs, and the directory that collects them
label_tag="${name_only}_${jobid}_${stageid}_${now}"
outdir="out_${label_tag}"
mkdir -p "${outdir}"

lar -c wcls_sim_sp.fcl -s g4.root -o sp.root || { echo "WCLS failed"; exit 1; }

# 4. Truth labelling
# Runs in its own scratch directory so the files written by lar can be
# collected from there and moved into the per-job output directory.
echo "Running: True labelling stage ..."
ls -lh
truthdir="truth_${label_tag}"
mkdir -p "${truthdir}"
# Abort if the scratch directory cannot be entered: otherwise lar would run
# in the wrong directory and the later popd would have nothing to undo.
if ! pushd "${truthdir}"; then
  echo "Cannot enter ${truthdir}"
  exit 1
fi

lar -c wcls-labelling2d_sep.fcl -s "../sp.root"
rc=$?
if [ "${rc}" -ne 0 ]; then
  echo "Truth labeling failed"
  popd
  exit 1
fi

echo "Truth dir contents after lar:"
ls -lh

# nullglob makes the loop run zero times when nothing matches, instead of
# iterating once over the literal pattern.
shopt -s nullglob
n_moved=0
for f in pixeldata-anode*.h5; do
  # A failed move would silently drop an output from the tarball, so stop.
  if ! mv -v "$f" "../${outdir}/${label_tag}_${f}"; then
    echo "Failed to move ${f} into ${outdir}"
    popd
    exit 1
  fi
  n_moved=$((n_moved + 1))
done
shopt -u nullglob

# Not fatal, but worth flagging in the job log.
if [ "${n_moved}" -eq 0 ]; then
  echo "Warning: no pixeldata-anode*.h5 files were produced" >&2
fi

popd

echo "Per-job output directory contents:"
# Listing is informational only; a failure here must not stop the job.
ls -lh "${outdir}" || true

# ---- Package per-job outputs into a tarball for stage-out ----
tarball="${outdir}.tgz"

echo "Creating tarball ${tarball} from ${outdir}"
# Stop before marking the input as processed if the tarball was not created;
# otherwise the job would report success without any output to upload.
if ! tar -czf "${tarball}" "${outdir}"; then
  echo "Failed to create tarball ${tarball}"
  exit 1
fi

echo "Tarball contents:"
tar -tzf "${tarball}"

ls -lh "${tarball}"

# ---- Mark as processed ----
# Record the PFN of the input handled by this job.
# NOTE(review): presumably read by the justIN wrapper after the jobscript
# ends - confirm against the justIN jobscript documentation.
echo "${pfn}" > justin-processed-pfns.txt

echo "Job completed successfully."

exit 0
justIN time: 2026-02-04 05:41:45 UTC       justIN version: 01.06.00