1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126
|
//------------------------------------------------------------------------------
// GB_dense_ewise3_accum: C += A+B where all 3 matries are dense
//------------------------------------------------------------------------------
// SuiteSparse:GraphBLAS, Timothy A. Davis, (c) 2017-2022, All Rights Reserved.
// SPDX-License-Identifier: Apache-2.0
//------------------------------------------------------------------------------
// C += A+B where no matrix is iso and all three matrices are as-if-full
#include "GB_dense.h"
#include "GB_binop.h"
#include "GB_stringify.h"
#ifndef GBCUDA_DEV
#include "GB_binop__include.h"
#endif
void GB_dense_ewise3_accum // C += A+B, all matrices dense
(
GrB_Matrix C, // input/output matrix
const GrB_Matrix A,
const GrB_Matrix B,
const GrB_BinaryOp op, // only GB_BINOP_SUBSET operators supported
GB_Context Context
)
{
#ifndef GBCUDA_DEV
//--------------------------------------------------------------------------
// check inputs
//--------------------------------------------------------------------------
ASSERT_MATRIX_OK (C, "C for dense C+=A+B", GB0) ;
ASSERT (!GB_ZOMBIES (C)) ;
ASSERT (!GB_JUMBLED (C)) ;
ASSERT (!GB_PENDING (C)) ;
ASSERT_MATRIX_OK (A, "A for dense C+=A+B", GB0) ;
ASSERT (!GB_ZOMBIES (A)) ;
ASSERT (!GB_JUMBLED (A)) ;
ASSERT (!GB_PENDING (A)) ;
ASSERT_MATRIX_OK (B, "B for dense C+=A+B", GB0) ;
ASSERT (!GB_ZOMBIES (B)) ;
ASSERT (!GB_JUMBLED (B)) ;
ASSERT (!GB_PENDING (B)) ;
ASSERT (GB_as_if_full (C)) ;
ASSERT (GB_as_if_full (A)) ;
ASSERT (GB_as_if_full (B)) ;
ASSERT (!GB_IS_BITMAP (C)) ;
ASSERT (!GB_IS_BITMAP (A)) ;
ASSERT (!GB_IS_BITMAP (B)) ;
ASSERT (!C->iso) ;
ASSERT (!A->iso) ;
ASSERT (!B->iso) ;
ASSERT_BINARYOP_OK (op, "op for dense C+=A+B", GB0) ;
ASSERT (!GB_OP_IS_POSITIONAL (op)) ;
ASSERT (op->ztype == C->type) ;
ASSERT (op->ztype == A->type) ;
ASSERT (op->ztype == B->type) ;
ASSERT (op->ztype == op->xtype) ;
ASSERT (op->ztype == op->ytype) ;
ASSERT (op->opcode >= GB_MIN_binop_code) ;
ASSERT (op->opcode <= GB_RDIV_binop_code) ;
GB_ENSURE_FULL (C) ; // convert C to full, if sparsity control allows it
// FUTURE::: handle IS*, LOR, LAND, LXOR operators
#ifdef GB_DEBUGIFY_DEFN
GB_debugify_ewise (false, GxB_FULL, C->type, NULL,
false, false, op, false, A, B) ;
#endif
//--------------------------------------------------------------------------
// determine the number of threads to use
//--------------------------------------------------------------------------
int64_t cnz = GB_nnz (C) ;
GB_GET_NTHREADS_MAX (nthreads_max, chunk, Context) ;
int nthreads = GB_nthreads (3 * cnz, chunk, nthreads_max) ;
//--------------------------------------------------------------------------
// define the worker for the switch factory
//--------------------------------------------------------------------------
#define GB_Cdense_ewise3_accum(op,xname) \
GB (_Cdense_ewise3_accum_ ## op ## xname)
#define GB_BINOP_WORKER(op,xname) \
{ \
GB_Cdense_ewise3_accum(op,xname) (C, A, B, nthreads) ; \
} \
break ;
//--------------------------------------------------------------------------
// launch the switch factory
//--------------------------------------------------------------------------
GB_Opcode opcode ;
GB_Type_code xcode, ycode, zcode ;
if (GB_binop_builtin (A->type, false, B->type, false,
op, false, &opcode, &xcode, &ycode, &zcode))
{
#define GB_BINOP_SUBSET
#include "GB_binop_factory.c"
}
else
{
// this function is not called if the op cannot be applied
ASSERT (GB_DEAD_CODE) ;
}
//--------------------------------------------------------------------------
// return result
//--------------------------------------------------------------------------
ASSERT_MATRIX_OK (C, "C+=A+B output", GB0) ;
#endif
}
|