1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
|
/******************************************************************************
* Copyright (c) Intel Corporation - All rights reserved. *
* This file is part of the LIBXSMM library. *
* *
* For information on the license, see the LICENSE file. *
* Further information: https://github.com/hfp/libxsmm/ *
* SPDX-License-Identifier: BSD-3-Clause *
******************************************************************************/
/* Hans Pabst (Intel Corp.)
******************************************************************************/
#include <stdlib.h>
#include <assert.h>
#include <stdio.h>
#if !defined(BLASINT_TYPE)
# define BLASINT_TYPE int
#endif
/** Function prototype for DGEMM; this way any kind of LAPACK/BLAS library is sufficient at link-time. */
void dgemm_(const char*, const char*, const BLASINT_TYPE*, const BLASINT_TYPE*, const BLASINT_TYPE*,
const double*, const double*, const BLASINT_TYPE*, const double*, const BLASINT_TYPE*,
const double*, double*, const BLASINT_TYPE*);
void init(int seed, double* dst, BLASINT_TYPE nrows, BLASINT_TYPE ncols, BLASINT_TYPE ld, double scale);
void init(int seed, double* dst, BLASINT_TYPE nrows, BLASINT_TYPE ncols, BLASINT_TYPE ld, double scale)
{
const double seed1 = scale * (seed + 1);
BLASINT_TYPE i = 0;
#if defined(_OPENMP)
# pragma omp parallel for private(i)
#endif
for (i = 0; i < ncols; ++i) {
BLASINT_TYPE j = 0;
for (; j < nrows; ++j) {
const BLASINT_TYPE k = i * ld + j;
dst[k] = (double)(seed1 / (k + 1));
}
for (; j < ld; ++j) {
const BLASINT_TYPE k = i * ld + j;
dst[k] = (double)seed;
}
}
}
int main(int argc, char* argv[])
{
int size = 2 == argc ? atoi(argv[1]) : 500;
const BLASINT_TYPE m = 2 < argc ? atoi(argv[1]) : 23;
const BLASINT_TYPE k = 3 < argc ? atoi(argv[3]) : m;
const BLASINT_TYPE n = 2 < argc ? atoi(argv[2]) : k;
const BLASINT_TYPE lda = 4 < argc ? atoi(argv[4]) : m;
const BLASINT_TYPE ldb = 5 < argc ? atoi(argv[5]) : k;
const BLASINT_TYPE ldc = 6 < argc ? atoi(argv[6]) : m;
const double alpha = 7 < argc ? atof(argv[7]) : 1.0;
const double beta = 8 < argc ? atof(argv[8]) : 1.0;
const char transa = 'N', transb = 'N';
double *a = 0, *b = 0, *c = 0;
int i;
if (9 < argc) size = atoi(argv[9]);
a = (double*)malloc(lda * k * sizeof(double));
b = (double*)malloc(ldb * n * sizeof(double));
c = (double*)malloc(ldc * n * sizeof(double));
printf("dgemm('%c', '%c', %i/*m*/, %i/*n*/, %i/*k*/,\n"
" %g/*alpha*/, %p/*a*/, %i/*lda*/,\n"
" %p/*b*/, %i/*ldb*/,\n"
" %g/*beta*/, %p/*c*/, %i/*ldc*/)\n",
transa, transb, m, n, k, alpha, (const void*)a, lda,
(const void*)b, ldb,
beta, (const void*)c, ldc);
assert(0 != a && 0 != b && 0 != c);
init(42, a, m, k, lda, 1.0);
init(24, b, k, n, ldb, 1.0);
init( 0, c, m, n, ldc, 1.0);
for (i = 0; i < size; ++i) {
dgemm_(&transa, &transb, &m, &n, &k, &alpha, a, &lda, b, &ldb, &beta, c, &ldc);
}
printf("Called %i times.\n", size);
free(a);
free(b);
free(c);
return EXIT_SUCCESS;
}
|