1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81
|
// Copyright (c) 2017-2023, University of Tennessee. All rights reserved.
// SPDX-License-Identifier: BSD-3-Clause
// This program is free software: you can redistribute it and/or modify it under
// the terms of the BSD 3-Clause license. See the accompanying LICENSE file.
#include <sycl/detail/cl.h>
#include <sycl.hpp>
#include <oneapi/mkl.hpp>
#include <stdexcept>
#include <cassert>
#include <cstdio>
//------------------------------------------------------------------------------
int main()
{
try {
double alpha = 2, beta = 3;
int n = 2;
double A[] = { 1, 2, 3, 4 };
double B[] = { 5, 4, 3, 2 };
double C[] = { 2, 3, 1, 0 };
double D[] = { 40, 61, 21, 28 };
// enumerate devices
std::vector< sycl::device > devices;
auto platforms = sycl::platform::get_platforms();
for (auto& platform : platforms) {
auto all_devices = platform.get_devices();
for (auto& device : all_devices) {
if (device.is_gpu()) {
devices.push_back( device );
}
}
}
if (devices.size() == 0) {
printf( "no sycl GPU devices\n" );
return -1;
}
sycl::queue queue( devices[0] );
double *dA, *dB, *dC;
dA = (double*) sycl::malloc_shared( n*n*sizeof(double), queue );
dB = (double*) sycl::malloc_shared( n*n*sizeof(double), queue );
dC = (double*) sycl::malloc_shared( n*n*sizeof(double), queue );
// dA = A, dB = B, dC = c
queue.memcpy( dA, A, n*n*sizeof(double) );
queue.memcpy( dB, B, n*n*sizeof(double) );
queue.memcpy( dC, C, n*n*sizeof(double) );
// C = alpha A B + beta C
oneapi::mkl::blas::gemm(
queue,
oneapi::mkl::transpose::N, oneapi::mkl::transpose::N,
n, n, n,
alpha, dA, n, dB, n, beta, dC, n );
// C = dC
queue.memcpy( dC, C, n*n*sizeof(double) );
sycl::free( dA, queue );
sycl::free( dB, queue );
sycl::free( dC, queue );
// verify C == D
double result = 0;
for (int i = 0; i < n*n; ++i) {
printf( "C[%d] = %.2f, D = %.2f\n", i, C[i], D[i] );
result += std::abs( D[i] - C[i] );
}
bool okay = (result == 0);
printf( "%s\n", okay ? "ok" : "failed" );
return ! okay;
}
catch (...) {
printf( "caught error\n" );
return -2;
}
}
|