File: arm-integer-dot-product.cl

package info (click to toggle)
llvm-toolchain-19 1%3A19.1.7-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,998,520 kB
  • sloc: cpp: 6,951,680; ansic: 1,486,157; asm: 913,598; python: 232,024; f90: 80,126; objc: 75,281; lisp: 37,276; pascal: 16,990; sh: 10,009; ml: 5,058; perl: 4,724; awk: 3,523; makefile: 3,167; javascript: 2,504; xml: 892; fortran: 664; cs: 573
file content (45 lines) | stat: -rw-r--r-- 2,202 bytes parent folder | download | duplicates (12)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
// RUN: %clang_cc1 %s -triple spir-unknown-unknown -finclude-default-header -fdeclare-opencl-builtins -cl-std=CL1.2 -emit-llvm -o - -O0 | FileCheck %s

// The "#pragma OPENCL EXTENSION" lines in this file are only accepted for
// backward compatibility.
// The builtins are made available with the following defines.

// One feature macro per extension exercised below. Each macro is defined to 1
// and carries the same name as the extension used in the pragma pair that
// precedes the corresponding test function.
#define cl_arm_integer_dot_product_int8 1
#define cl_arm_integer_dot_product_accumulate_int8 1
#define cl_arm_integer_dot_product_accumulate_int16 1
#define cl_arm_integer_dot_product_accumulate_saturate_int8 1

// The extension is switched on and immediately off again: the pragma must be
// accepted, and the calls below are still expected to compile afterwards.
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : enable
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : disable
// Calls arm_dot once with unsigned and once with signed 8-bit 4-element
// vectors; the directives after each call pin the mangled callee that the
// emitted IR must reference.
void test_int8(uchar4 ua, uchar4 ub, char4 sa, char4 sb)
{
    // uchar4 operands, result stored in a uint.
    uint unsigned_dot;
    unsigned_dot = arm_dot(ua, ub);
    // CHECK: call spir_func i32 @_Z7arm_dotDv4_hS_

    // char4 operands, result stored in an int.
    int signed_dot;
    signed_dot = arm_dot(sa, sb);
    // CHECK: call spir_func i32 @_Z7arm_dotDv4_cS_
}

// The extension is switched on and immediately off again: the pragma must be
// accepted, and the calls below are still expected to compile afterwards.
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int8 : enable
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int8 : disable
// Calls arm_dot_acc with 8-bit 4-element vectors plus a 32-bit accumulator,
// once unsigned and once signed; the directives after each call pin the
// mangled callee that the emitted IR must reference.
void test_accumulate_int8(uchar4 ua, uchar4 ub, uint uc, char4 sa, char4 sb, int c)
{
    // uchar4 operands with a uint accumulator.
    uint unsigned_acc;
    unsigned_acc = arm_dot_acc(ua, ub, uc);
    // CHECK: call spir_func i32 @_Z11arm_dot_accDv4_hS_j

    // char4 operands with an int accumulator.
    int signed_acc;
    signed_acc = arm_dot_acc(sa, sb, c);
    // CHECK: call spir_func i32 @_Z11arm_dot_accDv4_cS_i
}

// The extension is switched on and immediately off again: the pragma must be
// accepted, and the calls below are still expected to compile afterwards.
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int16 : enable
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int16 : disable
// Calls arm_dot_acc with 16-bit 2-element vectors plus a 32-bit accumulator,
// once unsigned and once signed; the directives after each call pin the
// mangled callee that the emitted IR must reference.
void test_accumulate_int16(ushort2 ua, ushort2 ub, uint uc, short2 sa, short2 sb, int c)
{
    // ushort2 operands with a uint accumulator.
    uint unsigned_acc;
    unsigned_acc = arm_dot_acc(ua, ub, uc);
    // CHECK: call spir_func i32 @_Z11arm_dot_accDv2_tS_j

    // short2 operands with an int accumulator.
    int signed_acc;
    signed_acc = arm_dot_acc(sa, sb, c);
    // CHECK: call spir_func i32 @_Z11arm_dot_accDv2_sS_i
}

// The extension is switched on and immediately off again: the pragma must be
// accepted, and the calls below are still expected to compile afterwards.
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_saturate_int8 : enable
#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_saturate_int8 : disable
// Calls arm_dot_acc_sat with 8-bit 4-element vectors plus a 32-bit
// accumulator, once unsigned and once signed; the directives after each call
// pin the mangled callee that the emitted IR must reference.
void test_accumulate_saturate_int8(uchar4 ua, uchar4 ub, uint uc, char4 sa, char4 sb, int c)
{
    // uchar4 operands with a uint accumulator.
    uint unsigned_sat;
    unsigned_sat = arm_dot_acc_sat(ua, ub, uc);
    // CHECK: call spir_func i32 @_Z15arm_dot_acc_satDv4_hS_j

    // char4 operands with an int accumulator.
    int signed_sat;
    signed_sat = arm_dot_acc_sat(sa, sb, c);
    // CHECK: call spir_func i32 @_Z15arm_dot_acc_satDv4_cS_i
}