File: 1794

package info (click to toggle)

pcp 7.1.1-1

links: PTS, VCS
area: main
in suites: forky, sid
size: 253,896 kB
sloc: ansic: 1,488,097; sh: 185,322; xml: 160,462; cpp: 83,813; python: 25,576; perl: 18,365; yacc: 6,877; lex: 2,864; makefile: 2,759; exp: 250; awk: 165; fortran: 60; java: 22

file content (84 lines) | stat: -rwxr-xr-x 2,142 bytes

#!/bin/sh
# PCP QA Test No. 1794
# Exercise pcp2arrow(1) parquet file generation.
#
# Copyright (c) 2024 Red Hat.  All Rights Reserved.
#

# Test identity: the script's own file name, echoed as the first line of
# the QA output.
seq=$(basename $0)
echo "QA output created by $seq"

# Shared QA environment for Python-based tests.  Names used later in this
# script but not defined in it ($python, $tmp, $here, $sudo, $seq_full,
# $PCP_BIN_DIR, _notrun) presumably come from this include.
. ./common.python

# Prerequisites: report "not run" rather than failing when the tool under
# test or the pandas module is unavailable.
if ! test -x $PCP_BIN_DIR/pcp2arrow
then
    _notrun "pcp2arrow(1) is not installed"
fi
if ! $python -c "import pandas" >/dev/null 2>&1
then
    _notrun "pandas is not installed"
fi

# Remove this test's temporary files; invoked from the exit/signal trap.
#
# Globals read:
#   here - directory to change into before deleting anything
#   sudo - optional privilege-escalation command prefix; deliberately left
#          unquoted so an empty value vanishes and a multi-word value splits
#   tmp  - path prefix of the temporary files; "$tmp" itself and every
#          "$tmp.<suffix>" sibling are removed
#
# Nothing is deleted when $tmp is empty or unset: without that guard the
# glob would degenerate to ".*" and wipe the dotfiles in $here.
_cleanup()
{
    cd "$here"
    if [ -n "$tmp" ]
    then
	# Only the variable is quoted; the trailing .* must stay a live glob.
	$sudo rm -rf "$tmp" "$tmp".*
    fi
}

# Exit code reported by the trap below; 0 means success.
status=0
# On normal exit (0) and on signals 1, 2, 3 and 15: run _cleanup, then leave
# with whatever $status holds at that moment.  The single quotes defer the
# expansion of $status until the trap actually fires.
trap '_cleanup; exit $status' 0 1 2 3 15

# Make output deterministic: reads stdin, writes the filtered text to stdout.
#
# Substitutions, applied in this order on every line:
#   1. each occurrence of the value of $tmp        -> TMP
#   2. text matching 0.0 followed by 1+ digits     -> SMALLNUM
#   3. any remaining text matching 0.0             -> ZERONUM
#
# NOTE(review): the "." in patterns 2 and 3 is an unescaped regex wildcard,
# so it matches any character, not only a decimal point.  Left untouched
# here because the recorded expected output may rely on it.
_filter()
{
    sed -e "s@$tmp@TMP@g" \
	-e 's@0.0[0-9][0-9]*@SMALLNUM@g' \
	-e 's@0.0@ZERONUM@g'
}

# real QA test starts here
#
# For every archive: convert it with pcp2arrow, log the produced path(s) to
# $seq_full, then load the result with pandas and print a filtered summary.
for archive in viewqa1 viewqa2 viewqa3 moomba.client proc; do
    printf '\n=== pcp2arrow %s\n' "$archive"
    pcp2arrow -z -t 10 -o $tmp.$archive -a archives/$archive
    find $tmp.$archive >> $seq_full
    $python -c "
import pandas
frame = pandas.read_parquet('$tmp.$archive')
names = frame.columns
if len(names) >= 42:
    # wide result: report only how many columns there are
    print('Columns:', len(names))
else:
    print('Columns:', sorted(names))
    # exercise bug in extracting instance values
    one_min = 'kernel.all.load[1 minute]'
    fifteen_min = 'kernel.all.load[15 minute]'
    if one_min in names:
        print('1 and 15 minute load averages')
        loads = frame[[one_min, fifteen_min]]
        print(loads.head())
print('Shape:', frame.shape)
" | _filter
done

# Test raw mode (pmFetchArchive optimization)
#
# Same flow as the loop above, but pcp2arrow is run with -r, limited to two
# metrics, and the summary additionally sanity-checks the first timestamp.
printf '\n%s\n' "=== Testing raw mode with --raw flag ==="
for archive in viewqa1 moomba.client; do
    printf '\n=== pcp2arrow --raw %s\n' "$archive"
    pcp2arrow -z -r -s 5 -o $tmp.raw.$archive -a archives/$archive kernel.all.load disk.all.read
    find $tmp.raw.$archive >> $seq_full
    $python -c "
import pandas
frame = pandas.read_parquet('$tmp.raw.$archive')
has_timestamp = 'timestamp' in frame.columns
print('Columns:', sorted(frame.columns))
print('Shape:', frame.shape)
print('Has timestamp:', has_timestamp)
# Verify timestamps are valid (not 1970 epoch)
if has_timestamp and len(frame) > 0:
    first = frame['timestamp'].iloc[0]
    if first.year >= 1999:
        print('Timestamp valid: True')
    else:
        print('Timestamp valid: False (year=%d)' % first.year)
" | _filter
done

# success, all done
# A bare exit fires the trap installed on 0 earlier in this script, which
# runs _cleanup and then exits with $status, so $status is what the caller
# sees as the test's exit code.
exit