#!/bin/sh
# PCP QA Test No. 1186
# pmie retry back-off for bad host
#
# Copyright (c) 2017 Ken McDonell. All Rights Reserved.
#
# :not_in_ci:
# This test depends on reasonable platform scheduler performance
# and when pmie yields while waiting for a back-off timeout,
# pmie needs to run shortly after the timeout expires.
# We've seen evidence of a back-off of 5 seconds leading to a
# 16 second delay before pmie runs again, and the test is doomed
# if this happens.
# the test is known by the name of this script file
seq=$(basename $0)
echo "QA output created by $seq"

# load the standard QA environment, output filters and checks
. ./common.product
. ./common.filter
. ./common.check
# Exit-trap helper: return to the directory recorded in $here, then
# remove $tmp and every path of the form $tmp.<suffix>, running rm
# through $sudo when that variable is non-empty.
_cleanup()
{
    cd "$here"
    # An empty $tmp would turn "$tmp".* into the glob .* and sweep up
    # dot-files in the current directory, so only remove when it is set.
    if [ -n "$tmp" ]
    then
        # $sudo stays unquoted on purpose: when empty it must vanish
        # instead of becoming an empty command word.
        $sudo rm -rf "$tmp" "$tmp".*
    fi
}
# assume failure; only the final lines of the test set this to 0
status=1

# on exit, hangup, interrupt, quit or terminate: tidy up, then leave
# with whatever $status holds at that moment
trap '_cleanup; exit $status' EXIT HUP INT QUIT TERM
# real QA test starts here

# one rule, evaluated against the host no.such.host.pcp.io (the
# "bad host" this test is about); quoted delimiter keeps it literal
cat <<'End-of-File' >"$tmp.config"
sample.long.one :no.such.host.pcp.io == 1 -> print "botch";
End-of-File

# export an empty PCP_DERIVED_CONFIG into pmie's environment
# (presumably so no derived-metric configuration is loaded -- confirm)
PCP_DERIVED_CONFIG=; export PCP_DERIVED_CONFIG

# run pmie in the background, capturing its stderr (where the
# -Dappl2 diagnostics are expected) in $tmp.err
pmie -Dappl2 -t 12 -c "$tmp.config" 2>"$tmp.err" &
pmie_pid=$!

# expect back off 5 + 10 + 12 + 12 ... = 27 + 12 + ...
# so 33 seconds falls after the retry at 27 and before the one at 39
sleep 33
kill -TERM $pmie_pid
# reap pmie before reading its log, so the capture below is complete
# and no pmie process is still writing to it
wait $pmie_pid
cat "$tmp.err" >>"$seq_full"
# Reduce the pmie diagnostics on stdin to the retry schedule on stdout.
#
# Every ":" is first turned into a space, so an eval time line such as
#   eval time: Wed Jul 5 19:51:44.118012 2017
# reaches awk with hours, minutes and seconds in fields 6, 7 and 8.
# Only lines between an "Evaluating task" line and the next "expr_"
# line are considered:
#   - "retry delta" lines are echoed (with their colons already gone)
#   - the first "eval time" line prints "eval time start"; each later
#     one prints "eval time last + N", N being the seconds since the
#     previous eval time, rounded to the nearest whole second.
# Only the time of day is used, so a negative difference is taken to
# mean the clock passed midnight once between the two samples.
_filter_backoff()
{
    # $PCP_AWK_PROG is deliberately unquoted: it is used as a command
    # word and may carry options as well as the program name.
    sed -e 's/:/ /g' \
    | $PCP_AWK_PROG '
/Evaluating task/               { inblock = 1; next }
/expr_/                         { inblock = 0; next }
inblock == 1 && /retry delta/   { print }
inblock == 1 && /eval time/     {
        this_time = $6*3600 + $7*60 + $8
        # an explicit flag, not last_time == 0, marks the first sample,
        # so an eval time of exactly 00:00:00 is not mistaken for none
        if (!have_last)
            print $1,$2,"start"
        else {
            diff = this_time - last_time
            delta = int(diff + 0.5)
            # int() truncates toward zero, so after a midnight wrap the
            # day has to be added back before rounding, not after
            if (delta < 0)
                delta = int(diff + 24*3600 + 0.5)
            print $1,$2,"last +",delta
        }
        last_time = this_time
        have_last = 1
}'
}

_filter_backoff <"$tmp.err"
# everything above ran to completion: replace the failure default so
# the exit trap leaves with a zero status
status=0
exit 0
|