File: shifts.ll

package info (click to toggle)
intel-graphics-compiler 1.0.17791.18-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 102,312 kB
  • sloc: cpp: 935,343; lisp: 286,143; ansic: 16,196; python: 3,279; yacc: 2,487; lex: 1,642; pascal: 300; sh: 174; makefile: 27
file content (61 lines) | stat: -rw-r--r-- 2,856 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2022-2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
;
; REQUIRES: llvm-14-plus
; RUN: igc_opt --opaque-pointers -enable-debugify --igc-replace-unsupported-intrinsics -S 2>&1 < %s | FileCheck %s
; ------------------------------------------------
; ReplaceUnsupportedIntrinsics: funnel shifts
; ------------------------------------------------

; Debug-info related check
;
; CHECK-NOT: WARNING
; CHECK: CheckModuleDebugify: PASS

define spir_kernel void @test_shift(i32 %src1, i32 %src2, i32 %src3) {
; CHECK-LABEL: @test_shift(
; CHECK-NEXT:  entry:
; CHECK:    [[TMP0:%.*]] = and i32 [[SRC3:%.*]], 31
; CHECK:    [[TMP1:%.*]] = sub i32 32, [[TMP0]]
; CHECK:    [[TMP2:%.*]] = shl i32 [[SRC1:%.*]], [[TMP0]]
; CHECK:    [[TMP3:%.*]] = lshr i32 [[SRC2:%.*]], [[TMP1]]
; CHECK:    [[TMP4:%.*]] = or i32 [[TMP2]], [[TMP3]]
; CHECK:    [[TMP5:%.*]] = and i32 [[SRC3]], 31
; CHECK:    [[TMP6:%.*]] = sub i32 32, [[TMP5]]
; CHECK:    [[TMP7:%.*]] = shl i32 [[SRC1]], [[TMP6]]
; CHECK:    [[TMP8:%.*]] = lshr i32 [[SRC2]], [[TMP5]]
; CHECK:    [[TMP9:%.*]] = or i32 [[TMP7]], [[TMP8]]
; CHECK:    [[TMP10:%.*]] = insertelement <2 x i32> undef, i32 [[SRC1]], i32 0
; CHECK:    [[TMP11:%.*]] = insertelement <2 x i32> [[TMP10]], i32 [[SRC2]], i32 1
; CHECK:    [[TMP12:%.*]] = insertelement <2 x i32> undef, i32 [[SRC2]], i32 0
; CHECK:    [[TMP13:%.*]] = insertelement <2 x i32> [[TMP12]], i32 [[SRC3]], i32 1
; CHECK:    [[TMP14:%.*]] = insertelement <2 x i32> undef, i32 [[SRC3]], i32 0
; CHECK:    [[TMP15:%.*]] = insertelement <2 x i32> [[TMP14]], i32 [[SRC1]], i32 1
; CHECK:    [[TMP16:%.*]] = and <2 x i32> [[TMP15]], <i32 31, i32 31>
; CHECK:    [[TMP17:%.*]] = sub <2 x i32> <i32 32, i32 32>, [[TMP16]]
; CHECK:    [[TMP18:%.*]] = shl <2 x i32> [[TMP11]], [[TMP17]]
; CHECK:    [[TMP19:%.*]] = lshr <2 x i32> [[TMP13]], [[TMP16]]
; CHECK:    [[TMP20:%.*]] = or <2 x i32> [[TMP18]], [[TMP19]]
; CHECK:    ret void
;
entry:
  %fshl_result = call i32 @llvm.fshl.i32(i32 %src1, i32 %src2, i32 %src3)
  %fshr_result = call i32 @llvm.fshr.i32(i32 %src1, i32 %src2, i32 %src3)
  %0 = insertelement <2 x i32> undef, i32 %src1, i32 0
  %1 = insertelement <2 x i32> %0, i32 %src2, i32 1
  %2 = insertelement <2 x i32> undef, i32 %src2, i32 0
  %3 = insertelement <2 x i32> %2, i32 %src3, i32 1
  %4 = insertelement <2 x i32> undef, i32 %src3, i32 0
  %5 = insertelement <2 x i32> %4, i32 %src1, i32 1
  %fshr_vector_result = call <2 x i32> @llvm.fshr.v2i32(<2 x i32> %1, <2 x i32> %3, <2 x i32> %5)
  ret void
}

declare i32 @llvm.fshl.i32(i32, i32, i32) #0
declare i32 @llvm.fshr.i32(i32, i32, i32) #0
declare <2 x i32> @llvm.fshr.v2i32(<2 x i32>, <2 x i32>, <2 x i32>) #0