File: generalized_spmv.cu

package info (click to toggle)
python-escript 5.0-3
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 87,772 kB
  • ctags: 49,550
  • sloc: python: 585,488; cpp: 133,173; ansic: 18,675; xml: 3,283; sh: 690; makefile: 215
file content (161 lines) | stat: -rw-r--r-- 5,596 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
#include <unittest/unittest.h>

#include <cusp/detail/device/generalized_spmv/coo_flat.h>
#include <cusp/detail/device/generalized_spmv/csr_scalar.h>

#include <cusp/array1d.h>
#include <cusp/coo_matrix.h>
#include <cusp/csr_matrix.h>
#include <cusp/multiply.h>
#include <cusp/gallery/poisson.h>
#include <cusp/gallery/random.h>

template <typename Matrix,
          typename Array1,
          typename Array2,
          typename Array3,
          typename BinaryFunction1,
          typename BinaryFunction2>
void generalized_spmv(const Matrix& A,
                      const Array1& x,
                      const Array2& y,
                            Array3& z,
                      BinaryFunction1 combine,
                      BinaryFunction2 reduce,
                      cusp::csr_format)
{
    cusp::detail::device::cuda::spmv_csr_scalar
        (A.num_rows,
         A.row_offsets.begin(), A.column_indices.begin(), A.values.begin(),
         x.begin(), y.begin(), z.begin(),
         combine, reduce);
}

template <typename Matrix,
          typename Array1,
          typename Array2,
          typename Array3,
          typename BinaryFunction1,
          typename BinaryFunction2>
void generalized_spmv(const Matrix& A,
                      const Array1& x,
                      const Array2& y,
                            Array3& z,
                      BinaryFunction1 combine,
                      BinaryFunction2 reduce,
                      cusp::coo_format)
{
    cusp::detail::device::cuda::spmv_coo
        (A.num_rows, A.num_entries,
         A.row_indices.begin(), A.column_indices.begin(), A.values.begin(),
         x.begin(), y.begin(), z.begin(),
         combine, reduce);
}

template <typename Matrix,
          typename Array1,
          typename Array2,
          typename Array3,
          typename BinaryFunction1,
          typename BinaryFunction2>
void generalized_spmv(const Matrix& A,
                      const Array1& x,
                      const Array2& y,
                            Array3& z,
                      BinaryFunction1 combine,
                      BinaryFunction2 reduce)
{
  generalized_spmv(A, x, y, z, combine, reduce, typename Matrix::format());
}

template <typename TestMatrix>
void _TestGeneralizedSpMV(void)
{
  typedef typename TestMatrix::index_type   IndexType;
  typedef typename TestMatrix::value_type   ValueType;
  typedef typename TestMatrix::memory_space MemorySpace;

  {
    // initialize example matrix
    cusp::array2d<ValueType, cusp::host_memory> A(5,4);
    A(0,0) = 13; A(0,1) = 80; A(0,2) =  0; A(0,3) =  0; 
    A(1,0) =  0; A(1,1) = 27; A(1,2) =  0; A(1,3) =  0;
    A(2,0) = 55; A(2,1) =  0; A(2,2) = 24; A(2,3) = 42;
    A(3,0) =  0; A(3,1) = 69; A(3,2) =  0; A(3,3) = 83;
    A(4,0) =  0; A(4,1) =  0; A(4,2) = 27; A(4,3) =  0;

    // convert to desired format
    TestMatrix test_matrix = A;

    // allocate vectors
    cusp::array1d<ValueType, MemorySpace> x(4);
    cusp::array1d<ValueType, MemorySpace> y(5);
    cusp::array1d<ValueType, MemorySpace> z(5,-1);

    // initialize input and output vectors
    x[0] = 1.0f; y[0] = 10.0f; 
    x[1] = 2.0f; y[1] = 20.0f;
    x[2] = 3.0f; y[2] = 30.0f;
    x[3] = 4.0f; y[3] = 40.0f;
                 y[4] = 50.0f;

    generalized_spmv(test_matrix, x, y, z, thrust::multiplies<ValueType>(), thrust::plus<ValueType>());

    ASSERT_EQUAL(z[0], 183.0f);
    ASSERT_EQUAL(z[1],  74.0f);
    ASSERT_EQUAL(z[2], 325.0f);
    ASSERT_EQUAL(z[3], 510.0f);
    ASSERT_EQUAL(z[4], 131.0f);
  }
 
  typedef typename cusp::coo_matrix<IndexType,ValueType,cusp::host_memory> HostMatrix;
  //cusp::array1d<HostMatrix, cusp::host_memory> matrices;
  std::vector<HostMatrix> matrices;

  { HostMatrix M; cusp::gallery::poisson5pt(M,   5,   5);   matrices.push_back(M); }
  { HostMatrix M; cusp::gallery::poisson5pt(M,  10,  10);   matrices.push_back(M); } 
  { HostMatrix M; cusp::gallery::poisson5pt(M, 117, 113);   matrices.push_back(M); } 
  { HostMatrix M; cusp::gallery::poisson5pt(M, 313, 444);   matrices.push_back(M); } 
  { HostMatrix M; cusp::gallery::poisson5pt(M, 876, 321);   matrices.push_back(M); } 
  { HostMatrix M; cusp::gallery::random( 21,  23,   5, M);  matrices.push_back(M); }
  { HostMatrix M; cusp::gallery::random( 45,  37,  15, M);  matrices.push_back(M); }
  { HostMatrix M; cusp::gallery::random(129, 127,  40, M);  matrices.push_back(M); }
  { HostMatrix M; cusp::gallery::random(355, 378, 234, M);  matrices.push_back(M); }
  { HostMatrix M; cusp::gallery::random(512, 512, 276, M);  matrices.push_back(M); }
 
  for(size_t i = 0; i < matrices.size(); i++)
  {
    TestMatrix M = matrices[i];

    // allocate vectors
    cusp::array1d<ValueType, MemorySpace> x = unittest::random_integers<bool>(M.num_cols);
    cusp::array1d<ValueType, MemorySpace> y(M.num_rows,0);
    cusp::array1d<ValueType, MemorySpace> z = unittest::random_integers<char>(M.num_rows);

    generalized_spmv(M, x, y, z, thrust::multiplies<ValueType>(), thrust::plus<ValueType>());
  
    // compute reference
    cusp::array1d<ValueType, MemorySpace> reference(M.num_rows,0);
    cusp::multiply(M, x, reference);

    ASSERT_EQUAL(z, reference);
  }
}


void TestCsrGeneralizedSpMV(void)
{
  typedef cusp::csr_matrix<int,float,cusp::device_memory> TestMatrix;
  _TestGeneralizedSpMV<TestMatrix>();
}
DECLARE_UNITTEST(TestCsrGeneralizedSpMV);

void TestCooGeneralizedSpMV(void)
{
  KNOWN_FAILURE;
  //typedef cusp::coo_matrix<int,float,cusp::device_memory> TestMatrix;
  //_TestGeneralizedSpMV<TestMatrix>();
}
DECLARE_UNITTEST(TestCooGeneralizedSpMV);