File: test113.m

package info (click to toggle)
suitesparse-graphblas 7.4.0%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 67,112 kB
  • sloc: ansic: 1,072,243; cpp: 8,081; sh: 512; makefile: 506; asm: 369; python: 125; awk: 10
file content (46 lines) | stat: -rw-r--r-- 1,033 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
function test113
%TEST113 performance tests for GrB_kron
%
% Builds two random sparse matrices A and B, computes kron (A,B) with the
% built-in function as the reference, then times GB_mex_kron with the 'times'
% operator for an increasing number of threads.  Each GraphBLAS result is
% checked against the built-in result, and the run time, the speedup relative
% to the 1-thread run, and the ratio versus the built-in time are printed.
%
% The thread/chunk settings returned by nthreads_get on entry are restored
% when the function exits, including when it exits because of an error.

% SuiteSparse:GraphBLAS, Timothy A. Davis, (c) 2017-2022, All Rights Reserved.
% SPDX-License-Identifier: Apache-2.0

fprintf ('test113: performance tests for GrB_kron\n') ;

% remember the current settings; the onCleanup object restores them when this
% function's workspace is cleared, so a failing assert or mexFunction error
% cannot leave the modified settings in place for later tests
[saved_nthreads, saved_chunk] = nthreads_get ;
restore_settings = onCleanup (@() nthreads_set (saved_nthreads, saved_chunk)) ; %#ok<NASGU>

chunk = 4096 ;
ncores = feature_numcores ;

A = sprand (310, 302, 0.1) ;
B = sprand (300, 301, 0.1) ;
fprintf ('nnz(A) %g\n', nnz (A)) ;
fprintf ('nnz(B) %g\n', nnz (B)) ;
fprintf ('nnz(C) %g\n', nnz (A) * nnz (B)) ;

% reference result and timing from the built-in kron
tic
C = kron (A,B) ;
tm = toc ;
fprintf ('built-in: %g sec\n', tm) ;

% m-by-n sparse matrix with no entries, passed as the first argument of
% GB_mex_kron (presumably the initial value of the output -- confirm against
% the mexFunction)
[m, n] = size (C) ;
Empty = sparse (m,n) ;

% time of the 1-thread run; set on the first iteration, which is always
% nthreads == 1
t1 = NaN ;

for nthreads = [1 2 4 8 16 20 40]

    % do not oversubscribe beyond twice the reported core count
    if (nthreads > 2*ncores)
        break ;
    end

    nthreads_set (nthreads,chunk) ;

    tic
    C1 = GB_mex_kron (Empty, [ ], [ ], 'times', A, B) ;
    tg = toc ;

    if (nthreads == 1)
        t1 = tg ;
    end

    % the GraphBLAS result must match the built-in result exactly
    assert (isequal (C, C1.matrix)) ;

    fprintf ('GB: %12.4f sec speedup: %12.4f  vs built-in: %12.4f\n', ...
        tg, t1 / tg, tm / tg) ;

end

% settings are restored here by the restore_settings onCleanup object