File: ger_problems.yaml

package info (click to toggle)
rocblas 6.4.4-4
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 1,082,776 kB
  • sloc: cpp: 244,923; f90: 50,012; python: 50,003; sh: 24,630; asm: 8,917; makefile: 150; ansic: 107; xml: 36; awk: 14
file content (41 lines) | stat: -rw-r--r-- 1,076 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
---
include: ../../../../clients/include/rocblas_common.yaml

Definitions:

  # Size list anchored as double_buffered_loads_size_range; it is referenced
  # as the matrix_size of the ger_double_buffered_bench test in this file.
  # NOTE(review): the anchor name suggests these shapes are meant to hit a
  # double-buffered-load kernel path -- confirm against the kernel dispatch.
  - &double_buffered_loads_size_range
    # M, N and lda all reference the same c_scan_value alias, which is not
    # defined in this file.
    # NOTE(review): presumably `scan` is a start..end..step range expanded by
    # the test generator and c_scan_value comes from the included common
    # file, giving square sizes -- confirm.
    - { scan: [2048..8192..512], M: *c_scan_value, N: *c_scan_value, lda: *c_scan_value }
    # One additional fixed square size (2176 = 2048 + 128).
    - { M: 2176, N: 2176,  lda: 2176 }

  # Size list anchored as generic_ger_size_range; it is referenced as the
  # matrix_size of both ger_generic_bench and gerc_generic_bench in this file.
  - &generic_ger_size_range  # non-fp32 will use generic kernel, fp32 will use special kernel
    # M and lda fixed at 2048; N is given as a range expression.
    # NOTE(review): `a..b..c` is presumably start..end..step as interpreted by
    # the test generator -- confirm.
    - { M: 2048, N: [2560..8192..512], lda: 2048 }
    # M and lda reference the c_scan_value alias (not defined in this file)
    # while N is given its own, much smaller range expression.
    - { scan: [2048..8192..512], M: *c_scan_value, N: [32..128..32], lda: *c_scan_value }

Tests:
  # Bench-category entry for the ger function, run over the sizes anchored as
  # double_buffered_loads_size_range under Definitions, with alpha, incx and
  # incy all set to 1.
  - name: ger_double_buffered_bench
    category: bench
    function: ger
    # Alias not defined in this file.
    # NOTE(review): presumably provided by the included rocblas_common.yaml
    # and selecting the real single/double precisions -- confirm.
    precision: *single_double_precisions
    alpha: 1
    incx: 1
    incy: 1
    matrix_size: *double_buffered_loads_size_range

  # Bench-category entry for the ger function, run over the sizes anchored as
  # generic_ger_size_range under Definitions, with alpha, incx and incy all
  # set to 1.
  - name: ger_generic_bench
    category: bench
    function: ger
    # Alias not defined in this file.
    # NOTE(review): presumably provided by the included rocblas_common.yaml
    # and selecting the real single/double precisions -- confirm.
    precision: *single_double_precisions
    alpha: 1
    incx: 1
    incy: 1
    matrix_size: *generic_ger_size_range

  # Bench-category entry for the gerc function, run over the same
  # generic_ger_size_range sizes as ger_generic_bench, with alpha, incx and
  # incy all set to 1.
  - name: gerc_generic_bench
    category: bench
    function: gerc
    # Alias not defined in this file.
    # NOTE(review): presumably provided by the included rocblas_common.yaml
    # and selecting the complex single/double precisions -- confirm.
    precision: *single_double_precisions_complex
    alpha: 1
    incx: 1
    incy: 1
    matrix_size: *generic_ger_size_range
...