1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
|
// Copyright (c) 2017-2023, University of Tennessee. All rights reserved.
// SPDX-License-Identifier: BSD-3-Clause
// This program is free software: you can redistribute it and/or modify it under
// the terms of the BSD 3-Clause license. See the accompanying LICENSE file.
#include "test.hh"
#include "lapack.hh"
#include "lapack/flops.hh"
#include "print_matrix.hh"
#include "error.hh"
#include "lapacke_wrappers.hh"
#include <vector>
// -----------------------------------------------------------------------------
/// Tests lapack::upgtr for a single scalar type.
///
/// Fills a packed matrix AP with random values, reduces it with
/// lapack::hptrd to obtain tau, then times lapack::upgtr. When a reference
/// run or a check is requested, LAPACKE_upgtr is timed on the same AP and
/// tau, and the two generated Q arrays are compared.
///
/// @param[in,out] params
///     Test parameters. Reads uplo, dim.n, align, tol, cache, ref and check;
///     writes time, and (when ref or check is 'y') ref_time, error and okay.
///
/// @param[in] run
///     If false, only marks the parameters that are used and returns.
template< typename scalar_t >
void test_upgtr_work( Params& params, bool run )
{
    using real_t = blas::real_type< scalar_t >;

    // Constants
    real_t eps = std::numeric_limits<real_t>::epsilon();

    // get & mark input values
    lapack::Uplo uplo = params.uplo();
    int64_t n = params.dim.n();
    int64_t align = params.align();
    real_t tol = params.tol() * eps;

    // mark non-standard output values
    params.ref_time();
    // params.ref_gflops();
    // params.gflops();

    if (! run)
        return;

    // ---------- setup
    int64_t ldq = roundup( blas::max( 1, n ), align );

    // E and tau have n-1 entries; clamp at zero so that n == 0 does not
    // wrap around to an enormous size_t and make the allocation throw.
    int64_t nm1 = (n > 0 ? n - 1 : 0);

    size_t size_AP  = static_cast<size_t>( n*(n+1)/2 );
    size_t size_D   = static_cast<size_t>( n );
    size_t size_E   = static_cast<size_t>( nm1 );
    size_t size_tau = static_cast<size_t>( nm1 );
    size_t size_Q   = static_cast<size_t>( ldq ) * n;

    std::vector< scalar_t > AP( size_AP );
    std::vector< scalar_t > tau( size_tau );
    std::vector< scalar_t > Q_tst( size_Q );
    std::vector< scalar_t > Q_ref( size_Q );
    std::vector< real_t > D( size_D );
    std::vector< real_t > E( size_E );

    // data() rather than &v[0]: indexing an empty vector is undefined.
    int64_t idist = 1;
    int64_t iseed[4] = { 0, 1, 2, 3 };
    lapack::larnv( idist, iseed, AP.size(), AP.data() );
    lapack::larnv( idist, iseed, tau.size(), tau.data() );

    // reduce to tridiagonal form to use the tau later
    int64_t info = lapack::hptrd( uplo, n, AP.data(), D.data(), E.data(), tau.data() );
    if (info != 0) {
        // Report the routine that actually failed (hptrd, not upgtr).
        fprintf( stderr, "lapack::hptrd returned error %lld\n", llong( info ) );
    }

    // ---------- run test
    testsweeper::flush_cache( params.cache() );
    double time = testsweeper::get_wtime();
    int64_t info_tst = lapack::upgtr( uplo, n, AP.data(), tau.data(), Q_tst.data(), ldq );
    time = testsweeper::get_wtime() - time;
    if (info_tst != 0) {
        fprintf( stderr, "lapack::upgtr returned error %lld\n", llong( info_tst ) );
    }

    params.time() = time;
    // double gflop = lapack::Gflop< scalar_t >::upgtr( n );
    // params.gflops() = gflop / time;

    if (params.ref() == 'y' || params.check() == 'y') {
        // ---------- run reference
        testsweeper::flush_cache( params.cache() );
        time = testsweeper::get_wtime();
        int64_t info_ref = LAPACKE_upgtr( to_char( uplo ), n, AP.data(), tau.data(), Q_ref.data(), ldq );
        time = testsweeper::get_wtime() - time;
        if (info_ref != 0) {
            fprintf( stderr, "LAPACKE_upgtr returned error %lld\n", llong( info_ref ) );
        }

        params.ref_time() = time;
        // params.ref_gflops() = gflop / time;

        // ---------- check error compared to reference
        // A mismatch in the returned info counts as a full error of 1.
        real_t error = 0;
        if (info_tst != info_ref) {
            error = 1;
        }
        error = blas::max( error, rel_error( Q_tst, Q_ref ) );
        params.error() = error;
        params.okay() = (error < tol);
    }
}
// -----------------------------------------------------------------------------
/// Entry point for the upgtr test: forwards to test_upgtr_work instantiated
/// for the scalar type selected by params.datatype().
/// Throws std::runtime_error for any datatype other than the four handled.
void test_upgtr( Params& params, bool run )
{
    using testsweeper::DataType;

    const DataType dtype = params.datatype();

    if (dtype == DataType::Single) {
        test_upgtr_work< float >( params, run );
    }
    else if (dtype == DataType::Double) {
        test_upgtr_work< double >( params, run );
    }
    else if (dtype == DataType::SingleComplex) {
        test_upgtr_work< std::complex<float> >( params, run );
    }
    else if (dtype == DataType::DoubleComplex) {
        test_upgtr_work< std::complex<double> >( params, run );
    }
    else {
        throw std::runtime_error( "unknown datatype" );
    }
}
|