From 51e384554b4653a05abea435432431cdca4728fb Mon Sep 17 00:00:00 2001 From: Dan Smith Date: Wed, 14 Apr 2021 07:23:10 -0700 Subject: [PATCH] Add some debug to async_wait failures This dumps some data in the case where we fail to wait for a child pid to help debug what is going on. This also cleans up a few review comments from the actual fix. Change-Id: I7b58ce0cf2b41bdffa448973edb4c992fe5f730c Related-Bug: #1923728 --- inc/async | 31 +++++++++++++++++++++++++------ 1 file changed, 25 insertions(+), 6 deletions(-) diff --git a/inc/async b/inc/async index 11bcdfa39e..56338f5343 100644 --- a/inc/async +++ b/inc/async @@ -48,7 +48,7 @@ function async_log { command=$(iniget $inifile job command | tr '#' '-') message=$(echo "$message" | sed "s#%command#$command#g") - echo "[Async ${name}:${pid}]: $message" + echo "[$BASHPID Async ${name}:${pid}]: $message" } # Inner function that actually runs the requested task. We wrap it like this @@ -57,7 +57,7 @@ function async_log { function async_inner { local name="$1" local rc - local fifo=${DEST}/async/${name}.fifo + local fifo="${DEST}/async/${name}.fifo" shift set -o xtrace if $* >${DEST}/async/${name}.log 2>&1; then @@ -116,6 +116,24 @@ function async_runfunc { async_run $1 $* } +# Dump some information to help debug a failed wait +function async_wait_dump { + local failpid=$1 + + echo "=== Wait failure dump from $BASHPID ===" + echo "Processes:" + ps -f + echo "Waiting jobs:" + for name in $(ls ${DEST}/async/*.ini); do + echo "Job $name :" + cat "$name" + done + echo "Failed PID status:" + sudo cat /proc/$failpid/status + sudo cat /proc/$failpid/cmdline + echo "=== End wait failure dump ===" +} + # Wait for an async future to complete. May return immediately if already # complete, or of the future has already been waited on (avoid this). May # block until the future completes. @@ -129,18 +147,18 @@ function async_wait { for name in $*; do running=$(ls ${DEST}/async/*.ini 2>/dev/null | wc -l) inifile="${DEST}/async/${name}.ini" - fifo=${DEST}/async/${name}.fifo + fifo="${DEST}/async/${name}.fifo" if pid=$(async_pidof "$name"); then async_log "$name" "Waiting for completion of %command" \ - "($running other jobs running)" + "running on PID $pid ($running other jobs running)" time_start async_wait if [[ "$pid" != "self" ]]; then # Signal the child to go ahead and exit since we are about to # wait for it to collect its status. - echo "Signaling exit" + async_log "$name" "Signaling child to exit" echo WAKEUP > $fifo - echo "Signaled" + async_log "$name" "Signaled" # Do not actually call wait if we ran synchronously if wait $pid; then rc=0 @@ -161,6 +179,7 @@ function async_wait { "$rc in $runtime seconds" rm -f $inifile if [ $rc -ne 0 ]; then + async_wait_dump $pid echo Stopping async wait due to error: $* break fi