1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53
|
/*
* Copyright 2008-2009 NVIDIA Corporation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef __ELL_H__
#define __ELL_H__
////////////////////////////////////////////////////////////////////////////////
//! Compute y += A*x for a sparse ELL matrix A and column vectors x and y
//!
//! Layout read by this routine: the n-th stored entry of row i is found at
//! Aj[n * stride + i] (column index) and Ax[n * stride + i] (value), i.e. the
//! data is organised as num_entries_per_row consecutive slabs, each holding
//! one entry for every row.
//!
//! @param num_rows            number of rows in A
//! @param num_cols            number of columns in A (not referenced by this routine)
//! @param num_entries_per_row number of stored entries in each row (shorter rows are zero padded)
//! @param stride              separation between consecutive slabs (stride >= num_rows, for alignment)
//! @param Aj                  ELL column indices
//! @param Ax                  ELL nonzero values
//! @param x                   column vector, read at the positions listed in Aj
//! @param y                   column vector, accumulated into in place
//!
//! @note Padding entries are processed like every other entry: x[Aj[...]] is
//!       read for them as well, so their column index must still be a valid
//!       index into x even though the matching value is zero.
////////////////////////////////////////////////////////////////////////////////
template <typename IndexType, typename ValueType>
void ell_matvec(const IndexType num_rows,
                const IndexType num_cols,
                const IndexType num_entries_per_row,
                const IndexType stride,
                const IndexType * Aj,
                const ValueType * Ax,
                const ValueType * x,
                      ValueType * y)
{
    (void) num_cols; // kept for interface compatibility; never read here

    // Step through the slabs with running pointers rather than recomputing
    // Aj + n * stride on every pass: that product would be evaluated in
    // IndexType and can overflow for large matrices when IndexType is a
    // 32-bit integer, long before the pointer itself runs out of range.
    const IndexType * Aj_n = Aj;
    const ValueType * Ax_n = Ax;

    for (IndexType n = 0; n < num_entries_per_row; n++) {
        // Accumulate the contribution of the n-th stored entry of every row.
        for (IndexType i = 0; i < num_rows; i++) {
            y[i] += Ax_n[i] * x[Aj_n[i]];
        }

        // Advance only while another slab follows, so no pointer is ever
        // formed beyond the last slab that is actually read.
        if (n + 1 < num_entries_per_row) {
            Aj_n += stride;
            Ax_n += stride;
        }
    }
}
#endif
|