File: gemm_problems.yaml

package info (click to toggle)
rocblas 6.4.4-4
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 1,082,776 kB
  • sloc: cpp: 244,923; f90: 50,012; python: 50,003; sh: 24,630; asm: 8,917; makefile: 150; ansic: 107; xml: 36; awk: 14
file content (83 lines) | stat: -rw-r--r-- 1,661 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
---
include: ../../../../clients/include/rocblas_common.yaml

Definitions:
  # Square problem sizes for the m == n == k benchmark: one scan entry in which
  # every matrix dimension and every leading dimension takes the current scan
  # value.
  # c_scan_value is not defined in this file; presumably it is provided by the
  # included rocblas_common.yaml.
  # ldd is listed next to ldc so that the output leading dimension is explicit,
  # as it is in the other gemm_ex tests of this file, instead of depending on a
  # default that is not visible here.
  - &square_sizes
    - scan: [ 512..8192..512 ]
      N: *c_scan_value
      M: *c_scan_value
      K: *c_scan_value
      lda: *c_scan_value
      ldb: *c_scan_value
      ldc: *c_scan_value
      ldd: *c_scan_value


Tests:
  # gemm_ex benchmark with N and K held at 384 while M is swept from 2048 up to
  # 24576 in steps of 2048 (reading the generator's a..b..c range syntax as
  # start..end..step - confirm against the test generator).
  # The precision, transA and transB lists are presumably expanded by the
  # generator into every combination.
  - name: gemm_ex_bench_const_nk
    category: bench
    function: gemm_ex
    # These precision aliases are not defined in this file; presumably they
    # come from the included rocblas_common.yaml.
    precision:
      - *hpa_half_precision
      - *single_precision
      - *double_precision
    transA: [ N, T ]
    transB: [ N, T ]
    alpha: 1
    incx: 1
    incy: 1
    N: 384
    M: 2048..24576..2048
    K: 384
    # Leading dimensions are constants sized for the largest case, so the same
    # value is used for every M in the sweep and for both transpose settings.
    lda: 24576 # M (transA N) or K (transA T); 24576 is the largest M swept
    ldb: 384 # K (transB N) or N (transB T); both are 384 here
    # ldc and ldd match the largest M swept.
    ldc: 24576
    ldd: 24576

  # gemm_ex benchmark with M and K held at 384 while N is swept from 2048 up to
  # 24576 in steps of 2048 (reading the generator's a..b..c range syntax as
  # start..end..step - confirm against the test generator).
  # The precision, transA and transB lists are presumably expanded by the
  # generator into every combination.
  - name: gemm_ex_bench_const_mk
    category: bench
    function: gemm_ex
    # These precision aliases are not defined in this file; presumably they
    # come from the included rocblas_common.yaml.
    precision:
      - *hpa_half_precision
      - *single_precision
      - *double_precision
    transA: [ N, T ]
    transB: [ N, T ]
    alpha: 1
    incx: 1
    incy: 1
    N: 2048..24576..2048
    M: 384
    K: 384
    # Leading dimensions are constants sized for the largest case, so the same
    # value is used for every N in the sweep and for both transpose settings.
    # lda: M (transA N) or K (transA T); both are 384 here.
    lda: 384
    # ldb: K (transB N) or N (transB T); 24576 is the largest N swept.
    ldb: 24576
    # ldc and ldd match M, which is fixed at 384.
    ldc: 384
    ldd: 384

  # gemm_ex benchmark with M and N held at 384 while K is swept from 2048 up to
  # 24576 in steps of 2048 (reading the generator's a..b..c range syntax as
  # start..end..step - confirm against the test generator).
  # The precision, transA and transB lists are presumably expanded by the
  # generator into every combination.
  - name: gemm_ex_bench_const_mn
    category: bench
    function: gemm_ex
    # These precision aliases are not defined in this file; presumably they
    # come from the included rocblas_common.yaml.
    precision:
      - *hpa_half_precision
      - *single_precision
      - *double_precision
    transA: [ N, T ]
    transB: [ N, T ]
    alpha: 1
    incx: 1
    incy: 1
    N: 384
    M: 384
    K: 2048..24576..2048
    # Leading dimensions are constants sized for the largest case, so the same
    # value is used for every K in the sweep and for both transpose settings.
    # lda: M (transA N) or K (transA T); 24576 is the largest K swept.
    lda: 24576
    # ldb: K (transB N) or N (transB T); 24576 is the largest K swept.
    ldb: 24576
    # ldc and ldd match M, which is fixed at 384.
    ldc: 384
    ldd: 384

  # gemm_ex benchmark over square problems (M == N == K). Unlike the other
  # tests in this file, it lists no dimensions itself: they come from the
  # square_sizes anchor declared under Definitions in this file.
  # The precision, transA and transB lists are presumably expanded by the
  # generator into every combination.
  - name: gemm_ex_bench_m_equals_n_equals_k
    category: bench
    function: gemm_ex
    # These precision aliases are not defined in this file; presumably they
    # come from the included rocblas_common.yaml.
    precision:
      - *hpa_half_precision
      - *single_precision
      - *double_precision
    transA: [ N, T ]
    transB: [ N, T ]
    alpha: 1
    incx: 1
    incy: 1
    # How the entries of matrix_size are merged into the test is decided by
    # the test generator, which is not shown here.
    matrix_size: *square_sizes
...