1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
|
## Mako template for a C kernel whose body is an OpenMP-parallel, SIMD loop
## over i in [0, n).  For every entry j of A it writes one element
## c[i + j*ldc] computed from elements b[i + kx*ldb].
##
## Names expected in the render context:
##   kname        - name of the generated function
##   dtype        - C element type of b and c
##   n, ldb, ldc  - when n is None these become runtime arguments of the
##                  generated function; otherwise they are emitted as
##                  constants inside it
##   k, m         - only used to choose the integer type of ldb / ldc
##   A            - iterable; entry j is passed to dot() to build the
##                  expression for c[i + j*ldc]
##                  (presumably row j of a constant matrix - TODO confirm)
##   beta         - 0: overwrite c;  1: accumulate into c;  anything else:
##                  add beta times the previous value of c
##   dot          - helper returning a C expression as text; it is given a
##                  callback that maps kx to the text 'b[i + kx*ldb]'
void
% if n is None:
${kname}(int n,
         const ${dtype}* restrict b, int ldb,
         ${dtype}* restrict c, int ldc)
{
% else:
${kname}(const ${dtype}* restrict b, ${dtype}* restrict c)
{
    const int n = ${n};
    ## Emit the stride as 'long long' once k*ldb (resp. m*ldc) reaches 2**31,
    ## so that the index arithmetic involving it is promoted to 64 bits.
    const ${'long long' if k*ldb >= 2**31 else 'int'} ldb = ${ldb};
    const ${'long long' if m*ldc >= 2**31 else 'int'} ldc = ${ldc};
% endif
    ## No private() clause here: the loop body declares no temporaries (each
    ## result goes straight into c), and the loop variable i is private by
    ## construction.  Listing an undeclared name such as dotp in a clause
    ## breaks compilation as soon as OpenMP is enabled.
    #pragma omp parallel for simd
    for (int i = 0; i < n; i++)
    {
    % for j, jx in enumerate(A):
    %   if beta == 0:
        c[i + ${j}*ldc] = ${dot(lambda kx: f'b[i + {kx}*ldb]', jx)};
    %   elif beta == 1:
        c[i + ${j}*ldc] += ${dot(lambda kx: f'b[i + {kx}*ldb]', jx)};
    %   else:
        c[i + ${j}*ldc] = ${dot(lambda kx: f'b[i + {kx}*ldb]', jx)}
                        + ${beta}*c[i + ${j}*ldc];
    %   endif
    % endfor
    }
}
|