1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
|
// Copyright (c) 2017-2023, University of Tennessee. All rights reserved.
// SPDX-License-Identifier: BSD-3-Clause
// This program is free software: you can redistribute it and/or modify it under
// the terms of the BSD 3-Clause license. See the accompanying LICENSE file.
#include "test.hh"
#include "lapack.hh"
#include "lapack/flops.hh"
#include "print_matrix.hh"
#include "error.hh"
#include "lapacke_wrappers.hh"
#include <vector>
#if LAPACK_VERSION >= 30700 // >= 3.7.0
// -----------------------------------------------------------------------------
template< typename scalar_t >
void test_larfy_work( Params& params, bool run )
{
using real_t = blas::real_type< scalar_t >;
// Constants
real_t eps = std::numeric_limits<real_t>::epsilon();
// get & mark input values
lapack::Uplo uplo = params.uplo();
int64_t n = params.dim.n();
int64_t incv = params.incx();
int64_t align = params.align();
real_t tol = params.tol() * eps;
// mark non-standard output values
params.ref_time();
//params.ref_gflops();
//params.gflops();
if (! run)
return;
// ---------- setup
scalar_t tau; // todo value
int64_t ldc = roundup( blas::max( 1, n ), align );
size_t size_V = (size_t) (1 + (n-1)*std::abs(incv));
size_t size_C = (size_t) ldc * n;
std::vector< scalar_t > V( size_V );
std::vector< scalar_t > C_tst( size_C );
std::vector< scalar_t > C_ref( size_C );
int64_t idist = 1;
int64_t iseed[4] = { 0, 1, 2, 3 };
lapack::larnv( idist, iseed, V.size(), &V[0] );
lapack::larnv( idist, iseed, 1, &tau );
lapack::generate_matrix( params.matrix, n, n, &C_tst[0], ldc );
C_ref = C_tst;
// ---------- run test
testsweeper::flush_cache( params.cache() );
double time = testsweeper::get_wtime();
lapack::larfy( uplo, n, &V[0], incv, tau, &C_tst[0], ldc );
time = testsweeper::get_wtime() - time;
params.time() = time;
//double gflop = lapack::Gflop< scalar_t >::larfy( n );
//params.gflops() = gflop / time;
if (params.ref() == 'y' || params.check() == 'y') {
// ---------- run reference
testsweeper::flush_cache( params.cache() );
time = testsweeper::get_wtime();
int64_t info_ref = LAPACKE_larfy( to_char( uplo ), n, &V[0], incv, tau, &C_ref[0], ldc );
time = testsweeper::get_wtime() - time;
if (info_ref != 0) {
fprintf( stderr, "LAPACKE_larfy returned error %lld\n", llong( info_ref ) );
}
params.ref_time() = time;
//params.ref_gflops() = gflop / time;
// ---------- check error compared to reference
real_t error = rel_error( C_tst, C_ref );
params.error() = error;
params.okay() = (error < tol);
}
}
// -----------------------------------------------------------------------------
void test_larfy( Params& params, bool run )
{
switch (params.datatype()) {
case testsweeper::DataType::Single:
test_larfy_work< float >( params, run );
break;
case testsweeper::DataType::Double:
test_larfy_work< double >( params, run );
break;
case testsweeper::DataType::SingleComplex:
test_larfy_work< std::complex<float> >( params, run );
break;
case testsweeper::DataType::DoubleComplex:
test_larfy_work< std::complex<double> >( params, run );
break;
default:
throw std::runtime_error( "unknown datatype" );
break;
}
}
#else
// -----------------------------------------------------------------------------
void test_larfy( Params& params, bool run )
{
fprintf( stderr, "larfy requires LAPACK >= 3.7.0\n\n" );
exit(0);
}
#endif // LAPACK >= 3.7.0
|