Skip to content

Commit d45eac1

Browse files
committed
dpl-workflow.sh: dump raw data for GPU crashes by default in online
1 parent d0daea3 commit d45eac1

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

prodtests/full-system-test/dpl-workflow.sh

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -222,6 +222,9 @@ has_detector_flp_processing CPV && CPV_INPUT=digits
222222
! has_detector_flp_processing TOF && TOF_CONFIG+=" --local-cmp"
223223

224224
if [[ $EPNSYNCMODE == 1 ]]; then
225+
# dump raw data in case of GPU crash and set dump directory size limits; files are automatically cleaned by EPN after 60 days
226+
GPU_CONFIG_KEY+="GPU_proc.debugOnFailure=1;GPU_proc.debugOnFailureDirectory=/data/tf/debug;GPU_proc.debugOnFailureMaxFiles=1000;GPU_proc.debugOnFailureMaxSize=500;GPU_proc.debugOnFailureSignalMask=2240;"
227+
225228
EVE_OPT+=" --eve-dds-collection-index 0"
226229
MIDDEC_CONFIG+=" --feeId-config-file \"$MID_FEEID_MAP\""
227230
if [[ $EXTINPUT == 1 ]] && [[ $GPUTYPE != "CPU" ]] && [[ -z "$GPU_NUM_MEM_REG_CALLBACKS" ]]; then

0 commit comments

Comments
 (0)