1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82
|
function test118
%TEST118 performance tests for GrB_assign
% test C(:,:)<M> = A
% SuiteSparse:GraphBLAS, Timothy A. Davis, (c) 2017-2022, All Rights Reserved.
% SPDX-License-Identifier: Apache-2.0
fprintf ('test118 ----------------------------------- C(:,:)<M> = A\n') ;
[save save_chunk] = nthreads_get ;
chunk = 4096 ;
rng ('default') ;
n = 2000 ;
S = sparse (n,n) ;
I.begin = 0 ;
I.inc = 1 ;
I.end = n-1 ;
ncores = feature_numcores ;
for dc = [0 1e-5 1e-4 1e-3 1e-2 1e-1 0.5]
C0 = sparse (n,n,dc) ;
for da = [1e-5 1e-4 1e-3 1e-2 1e-1 0.5]
A = sprand (n, n, da) ;
for dm = [1e-5 1e-4 1e-3 1e-2 1e-1 0.5]
M = spones (sprand (n, n, dm)) ;
Mbool = logical (M) ;
fprintf ('\n--------------------------------------\n') ;
fprintf ('dc: %g, da: %g, dm: %g ', dc, da, dm) ;
fprintf ('\n') ;
fprintf ('nnz(M): %g million, ', nnz (M) / 1e6) ;
fprintf ('nnz(A): %g million\n', nnz (A) / 1e6) ;
% warmup
% C1 = C0 ;
% C1 (Mbool) = A (Mbool) ;
tic
C1 = C0 ;
C1 (Mbool) = A (Mbool) ;
tm = toc ;
t1 = 0 ;
for nthreads = [1 2 4 8 16 20 32 40 64]
if (nthreads > 2*ncores)
break ;
end
nthreads_set (nthreads, chunk) ;
if (nthreads > 1 & t1 < 0.1)
continue
end
% if (nnz(A)<nnz(M)) use method 06s, else method 06n
C2 = GB_mex_assign (C0, M, [ ], A, I, I) ;
tic
C2 = GB_mex_assign (C0, M, [ ], A, I, I) ;
tg = toc ;
assert (isequal (C1, C2.matrix)) ;
if (nthreads == 1)
t1 = tg ;
end
fprintf ('%3d : %8.4f GB: %8.4f', nthreads, tm, tg) ;
fprintf (' speedup: %8.2f %8.2f\n', t1/tg, tm / tg) ;
end
end
end
end
nthreads_set (save, save_chunk) ;
|