File: split-sink-merge.ll

package info (click to toggle)
intel-graphics-compiler2 2.16.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 106,644 kB
  • sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
file content (72 lines) | stat: -rw-r--r-- 3,662 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; RUN: igc_opt -igc-wave-shuffle-index-sinking -S < %s | FileCheck %s
; ------------------------------------------------
; WaveShuffleIndexSinking
;
; This test does not primarily demonstrate the benefits/profitability of the optimization
; This test focuses on the auxiliary functionality of splitting and merging various WaveShuffleIndex instructions
; Only the 4 combinations of N/N, N/Y, Y/N, and Y/Y for Split/Merge need to be considered, Sink is for informational purposes only
;
; Test Scenarios
; %ws0: Split: N, Sink: Y, Merge: N
; %ws1: Split: Y, Sink: Y/Y, Merge: N (profitable to sink both paths)
; %ws2: Split: Y, Sink: Y/N, Merge: N (profitable to sink one path)
; %ws3: Split: Y, Sink: N/N, Merge: Y (nothing to group and sink with)
; %ws4: Split: N, Sink: N, Merge: Y
; %ws5: Split: N, Sink: N, Merge: Y
; ------------------------------------------------

define void @test_split_sink_merge(i32 %a, i32 %b, i32 %c, i32 %d) {
; CHECK: [[USE1_WS0_WS1C1_HOISTED:%.*]] = shl i32 %a, 2
; CHECK: [[WS0:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 [[USE1_WS0_WS1C1_HOISTED]], i32 0, i32 0)
  %ws0 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %a, i32 0, i32 0)
  %use1_ws0 = shl i32 %ws0, 2
; CHECK: add i32 [[WS0]], %c
  %anchor1_ws0 = add i32 %use1_ws0, %c
; CHECK: [[USE2_WS1C2_WS2C1_HOISTED:%.*]] = shl i32 %a, 3
; CHECK-DAG: [[WS1C1:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 [[USE1_WS0_WS1C1_HOISTED]], i32 1, i32 0)
; CHECK-DAG: [[WS1C2:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 [[USE2_WS1C2_WS2C1_HOISTED]], i32 1, i32 0)
  %ws1 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %a, i32 1, i32 0)
  %use1_ws1 = shl i32 %ws1, 2
; CHECK: add i32 [[WS1C1]], %c
  %anchor1_ws1 = add i32 %use1_ws1, %c
  %use2_ws1 = shl i32 %ws1, 3
; CHECK: add i32 [[WS1C2]], %d
  %anchor2_ws1 = add i32 %use2_ws1, %d
; CHECK-DAG: [[WS2C1:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 [[USE2_WS1C2_WS2C1_HOISTED]], i32 2, i32 0)
; CHECK-DAG: [[WS2C2:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %a, i32 2, i32 0)
  %ws2 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %a, i32 2, i32 0)
  %use1_ws2 = shl i32 %ws2, 3
; CHECK: add i32 [[WS2C1]], %d
  %anchor1_ws2 = add i32 %use1_ws2, %d
; CHECK: [[USE2_WS2C2_NOT_HOISTED:%.*]] = shl i32 [[WS2C2]], 4
  %use2_ws2 = shl i32 %ws2, 4
; CHECK: add i32 [[USE2_WS2C2_NOT_HOISTED]], %d
  %anchor2_ws2 = add i32 %use2_ws2, %d
; CHECK: [[WS3:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 0, i32 0)
  %ws3 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 0, i32 0)
; CHECK-NEXT: add i32 [[WS3]], %c
  %use1_ws3 = add i32 %ws3, %c
; CHECK-NEXT: add i32 [[WS3]], %d
  %use2_ws3 = add i32 %ws3, %d
; CHECK: [[WS4:%.*]] = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 1, i32 0)
  %ws4 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 1, i32 0)
; CHECK-NEXT: {{%.*}} = add i32 [[WS4]], %c
  %use1_ws4 = add i32 %ws4, %c
; CHECK-NOT: call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 1, i32 0)
  %ws5 = call i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32 %b, i32 1, i32 0)
; CHECK-NEXT: {{%.*}} = add i32 [[WS4]], %d
  %use1_ws5 = add i32 %ws5, %d
  ret void
}

; Function Attrs: convergent nounwind readnone
declare i32 @llvm.genx.GenISA.WaveShuffleIndex.i32(i32, i32, i32) #0

attributes #0 = { convergent nounwind readnone }