File: ell.h

package info (click to toggle)
python-escript 5.0-3
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 87,772 kB
  • ctags: 49,550
  • sloc: python: 585,488; cpp: 133,173; ansic: 18,675; xml: 3,283; sh: 690; makefile: 215
file content (53 lines) | stat: -rw-r--r-- 2,038 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
/*
 *  Copyright 2008-2009 NVIDIA Corporation
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */


#ifndef __ELL_H__
#define __ELL_H__

////////////////////////////////////////////////////////////////////////////////
//! Compute y += A*x for a sparse ELL matrix A and column vectors x and y
//!
//! Entry n of row i is stored at position n * stride + i of Aj and Ax, so the
//! n-th entries of all rows form a contiguous run of num_rows elements, and
//! consecutive runs start stride elements apart.
//!
//! Every slot is read, including padding: a padded slot must therefore hold a
//! column index that is valid for x (its value is expected to be zero so that
//! it contributes nothing to y).
//!
//! @param num_rows             number of rows in A
//! @param num_cols             number of columns in A (not used by this routine)
//! @param num_entries_per_row  number of columns stored for each row (shorter rows are zero padded)
//! @param stride               separation between consecutive entries of a row (stride >= num_rows, for alignment)
//! @param Aj                   ELL column indices
//! @param Ax                   ELL nonzero values
//! @param x                    column vector (input)
//! @param y                    column vector (updated in place)
////////////////////////////////////////////////////////////////////////////////
template <typename IndexType, typename ValueType>
void ell_matvec(const IndexType num_rows,
                const IndexType num_cols,
                const IndexType num_entries_per_row,
                const IndexType stride,
                const IndexType * Aj,
                const ValueType * Ax,
                const ValueType * x,
                      ValueType * y)
{
    // Walk the ELL columns by bumping the base pointers instead of computing
    // Aj + n * stride: the product n * stride is evaluated in IndexType and
    // can overflow (undefined behaviour for signed types, silent wrap-around
    // for unsigned ones) on large matrices even though the resulting address
    // is perfectly representable.
    const IndexType * Aj_n = Aj;
    const ValueType * Ax_n = Ax;

    for(IndexType n = 0; n < num_entries_per_row; n++){
        // Advance on entry to every column but the first, so that no pointer
        // past the start of the last column is ever formed.
        if (n > 0){
            Aj_n += stride;
            Ax_n += stride;
        }

        // Accumulate the contribution of the n-th stored entry of each row.
        for(IndexType i = 0; i < num_rows; i++){
            y[i] += Ax_n[i] * x[Aj_n[i]];
        }
    }
}



#endif