File: GB_emult_02c.c

package info (click to toggle)
suitesparse 1%3A7.10.1%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 254,920 kB
  • sloc: ansic: 1,134,743; cpp: 46,133; makefile: 4,875; fortran: 2,087; java: 1,826; sh: 996; ruby: 725; python: 495; asm: 371; sed: 166; awk: 44
file content (58 lines) | stat: -rw-r--r-- 2,311 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
//------------------------------------------------------------------------------
// GB_emult_02c: C<#M>=A.*B when A is sparse/hyper; M and B are bitmap/full
//------------------------------------------------------------------------------

// SuiteSparse:GraphBLAS, Timothy A. Davis, (c) 2017-2025, All Rights Reserved.
// SPDX-License-Identifier: Apache-2.0

//------------------------------------------------------------------------------

// C is sparse, with the same sparsity structure as A.
// M is bitmap/full.  A is sparse/hyper, and B is bitmap/full.

{

    //--------------------------------------------------------------------------
    // Method2(c): C<#M>=A.*B, A is sparse/hyper, M and B are bitmap/full
    //--------------------------------------------------------------------------

    // This is a template body: every name used below other than the locals
    // declared here (M, A_nthreads, A_ntasks, kfirst_Aslice, klast_Aslice,
    // pstart_Aslice, Cp_kfirst, Ah, Ap, Ai, Bb, Bx, Ax, Ci, Cx, Cp, vlen,
    // Mask_struct, Mask_comp, A_iso, B_iso, and the GB_* macros) must already
    // be in scope where this file is included.

    // Mb: the M->b array of the mask, tested through GBb_M below.
    // Mx: the mask values, or NULL when Mask_struct is set so that the values
    //     are not consulted.  NOTE(review): GB_MCAST is presumably expected to
    //     treat a NULL Mx as "true" -- confirm against its definition.
    // msize: size of the mask type, passed to GB_MCAST.
    const int8_t *restrict Mb = M->b ;
    const GB_M_TYPE *restrict Mx = (Mask_struct) ? NULL : ((GB_M_TYPE *) M->x) ;
    const size_t msize = M->type->size ;

    // One loop iteration per task; iterations are handed out dynamically, one
    // at a time, to at most A_nthreads threads.
    int tid ;
    #pragma omp parallel for num_threads(A_nthreads) schedule(dynamic,1)
    for (tid = 0 ; tid < A_ntasks ; tid++)
    {
        // task tid handles vectors kfirst through klast of A, inclusive
        int64_t kfirst = kfirst_Aslice [tid] ;
        int64_t klast  = klast_Aslice  [tid] ;
        for (int64_t k = kfirst ; k <= klast ; k++)
        {
            // j is the index of the kth vector of A, as given by GBh_A.
            // pB_start is the offset of entry (0,j) in arrays that hold vlen
            // entries per vector; it is used to index both B and M below.
            int64_t j = GBh_A (Ah, k) ;
            int64_t pB_start = j * vlen ;
            // NOTE(review): GB_GET_PA_AND_PC presumably declares and sets pA,
            // pA_end, and pC for the part of vector k owned by this task
            // (they are not declared anywhere else in this block) -- confirm
            // against the macro definition.
            GB_GET_PA_AND_PC (pA, pA_end, pC, tid, k, kfirst, klast,
                pstart_Aslice, Cp_kfirst,
                GB_IGET (Ap, k), GB_IGET (Ap, k+1), GB_IGET (Cp, k)) ;
            for ( ; pA < pA_end ; pA++)
            { 
                // row index of the entry of A at position pA
                int64_t i = GB_IGET (Ai, pA) ;
                // position of entry (i,j) in B, and also in M
                int64_t pB = pB_start + i ;
                // skip this entry of A if the GBb_B test on B fails at pB
                if (!GBb_B (Bb, pB)) continue ;
                // mask entry M(i,j): the GBb_M test and the GB_MCAST value
                // must both hold; Mask_comp then flips the result
                bool mij = GBb_M (Mb, pB) && GB_MCAST (Mx, pB, msize) ;
                mij = mij ^ Mask_comp ;
                // skip this entry if the (possibly flipped) mask rejects it
                if (!mij) continue ;
                // C (i,j) = A (i,j) .* B (i,j)
                GB_ISET (Ci, pC, i) ;       // Ci [pC] = i ;
                // The value of C(i,j) is only computed here when GB_ISO_EMULT
                // is not defined; otherwise only the row index is written.
                #ifndef GB_ISO_EMULT
                GB_DECLAREA (aij) ;
                GB_GETA (aij, Ax, pA, A_iso) ;     
                GB_DECLAREB (bij) ;
                GB_GETB (bij, Bx, pB, B_iso) ;
                GB_EWISEOP (Cx, pC, aij, bij, i, j) ;
                #endif
                // advance to the next output position in C
                pC++ ;
            }
        }
    }
}