File: fp-matrix-pragma.c

package info (click to toggle)
llvm-toolchain-19 1%3A19.1.7-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,998,520 kB
  • sloc: cpp: 6,951,680; ansic: 1,486,157; asm: 913,598; python: 232,024; f90: 80,126; objc: 75,281; lisp: 37,276; pascal: 16,990; sh: 10,009; ml: 5,058; perl: 4,724; awk: 3,523; makefile: 3,167; javascript: 2,504; xml: 892; fortran: 664; cs: 573
file content (51 lines) | stat: -rw-r--r-- 1,663 bytes parent folder | download | duplicates (7)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
// RUN: %clang -emit-llvm -S -fenable-matrix -mllvm -disable-llvm-optzns %s -o - | FileCheck %s
// UNSUPPORTED: target={{.*}}-zos{{.*}}

// 2x2 matrix types declared with Clang's matrix_type attribute; the test's
// command line passes -fenable-matrix. The expected IR throughout this file
// refers to values of these types as 4-element vectors (<4 x float> for
// fx2x2_t, <4 x i32> for ix2x2_t).
typedef float fx2x2_t __attribute__((matrix_type(2, 2)));
typedef int ix2x2_t __attribute__((matrix_type(2, 2)));

// Exercises contract(fast) on a float matrix expression. The patterns below
// expect the `contract` fast-math flag on each of the three operations, in
// source order: the matrix-by-matrix product (a call to the
// llvm.matrix.multiply intrinsic), the division by the scalar `c`, and the
// multiplication by the scalar `d`.
fx2x2_t fp_matrix_contract(fx2x2_t a, fx2x2_t b, float c, float d) {
// CHECK: call contract <4 x float> @llvm.matrix.multiply.v4f32.v4f32.v4f32
// CHECK: fdiv contract <4 x float>
// CHECK: fmul contract <4 x float>
// The pragma is placed before the first statement of the body so that it
// covers the return expression.
#pragma clang fp contract(fast)
  return (a * b / c) * d;
}

// Exercises reassociate(on) on element-wise float matrix arithmetic. The
// patterns below expect the `reassoc` fast-math flag on the addition and then
// on the subtraction, matching the left-to-right evaluation of `a + b - c`.
fx2x2_t fp_matrix_reassoc(fx2x2_t a, fx2x2_t b, fx2x2_t c) {
// CHECK: fadd reassoc <4 x float>
// CHECK: fsub reassoc <4 x float>
#pragma clang fp reassociate(on)
  return a + b - c;
}

// Exercises both options given in a single pragma. The patterns below expect
// the combined `reassoc contract` flags on the matrix product (the
// llvm.matrix.multiply call) and on the following element-wise addition.
fx2x2_t fp_matrix_ops(fx2x2_t a, fx2x2_t b, fx2x2_t c) {
// CHECK: call reassoc contract <4 x float> @llvm.matrix.multiply.v4f32.v4f32.v4f32
// CHECK: fadd reassoc contract <4 x float>
#pragma clang fp contract(fast) reassociate(on)
  return a * b + c;
}

// Exercises the compound-assignment forms of the matrix operators under
// contract(fast) and reassociate(on). Each statement in the body corresponds
// to one pattern below, in the same order, and every expected instruction
// carries the `reassoc contract` flags:
//   a *= b  (matrix * matrix) -> call to llvm.matrix.multiply
//   a += c                    -> fadd
//   a -= d                    -> fsub
//   a *= e  (matrix * scalar) -> fmul
//   a /= f  (matrix / scalar) -> fdiv
fx2x2_t fp_matrix_compound_ops(fx2x2_t a, fx2x2_t b, fx2x2_t c, fx2x2_t d,
    float e, float f) {
// CHECK: call reassoc contract <4 x float> @llvm.matrix.multiply.v4f32.v4f32.v4f32
// CHECK: fadd reassoc contract <4 x float>
// CHECK: fsub reassoc contract <4 x float>
// CHECK: fmul reassoc contract <4 x float>
// CHECK: fdiv reassoc contract <4 x float>
#pragma clang fp contract(fast) reassociate(on)
  a *= b;
  a += c;
  a -= d;
  a *= e;
  a /= f;

  return a;
}

// Integer counterpart of fp_matrix_ops: same expression and same pragma, but
// with an int element type. The patterns below expect the matrix product call
// and the integer `add` to be written without any fast-math flags between the
// opcode and the <4 x i32> type.
ix2x2_t int_matrix_ops(ix2x2_t a, ix2x2_t b, ix2x2_t c) {
// CHECK: call <4 x i32> @llvm.matrix.multiply.v4i32.v4i32.v4i32
// CHECK: add <4 x i32>
#pragma clang fp contract(fast) reassociate(on)
  return a * b + c;
}