; File: wave-ballot-cse-control-flow.ll
;
; Package listing metadata that accompanied this file:
;   package: intel-graphics-compiler2 2.16.0-2
;   links: PTS, VCS
;   area: main
;   in suites: sid
;   size: 106,644 kB
;   sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
;   file content: 145 lines | stat: -rw-r--r-- 5,688 bytes
;
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2025 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================

; RUN: igc_opt -wave-ballot-cse -S %s | FileCheck %s

; Test that CSE does NOT work across basic blocks (due to convergent nature)
;
; The entry block, %then and %else each issue a WaveBallot call with the same
; operands (i1 true, i32 0). The expected output below still contains all
; three calls, and each add keeps its own block-local operand (%mask2 /
; %mask3), i.e. the function is expected to come out of the pass unchanged.
define i32 @test_no_cross_block_cse(i1 %cond) {
; CHECK-LABEL: @test_no_cross_block_cse
; CHECK-NEXT:    %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
; CHECK-NEXT:    br i1 %cond, label %then, label %else
; CHECK:       then:
; CHECK-NEXT:    %mask2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
; CHECK-NEXT:    %result_then = add i32 %mask1, %mask2
; CHECK-NEXT:    br label %merge
; CHECK:       else:
; CHECK-NEXT:    %mask3 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
; CHECK-NEXT:    %result_else = add i32 %mask1, %mask3
; CHECK-NEXT:    br label %merge
; CHECK:       merge:
; CHECK-NEXT:    %result = phi i32 [ %result_then, %then ], [ %result_else, %else ]
; CHECK-NEXT:    ret i32 %result
;
  ; Entry-block ballot; its result is used by the adds in both successors.
  %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  br i1 %cond, label %then, label %else

then:
  ; Same operands as %mask1, but in a different block: must be kept.
  %mask2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %result_then = add i32 %mask1, %mask2
  br label %merge

else:
  ; Same operands as %mask1 and %mask2, again in its own block: must be kept.
  %mask3 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %result_else = add i32 %mask1, %mask3
  br label %merge

merge:
  ; Join point: selects whichever branch's sum reached here.
  %result = phi i32 [ %result_then, %then ], [ %result_else, %else ]
  ret i32 %result
}

; Test within-block CSE works in multiple blocks
;
; Each of the entry, %then and %else blocks contains two WaveBallot calls with
; identical operands. The expected output below has exactly one call per
; block, and each add uses the surviving value for both operands (for example
; `add i32 %mask1, %mask1`). The three blocks use different operand pairs
; ((true, 0), (false, 1), (true, 2)), so no two blocks share an identical call.
define i32 @test_within_block_cse_multiple_blocks(i1 %cond) {
; CHECK-LABEL: @test_within_block_cse_multiple_blocks
; CHECK-NEXT:    %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
; CHECK-NEXT:    %entry_work = add i32 %mask1, %mask1
; CHECK-NEXT:    br i1 %cond, label %then, label %else
; CHECK:       then:
; CHECK-NEXT:    %mask_then = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
; CHECK-NEXT:    %result_then = add i32 %mask_then, %mask_then
; CHECK-NEXT:    br label %merge
; CHECK:       else:
; CHECK-NEXT:    %mask_else = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
; CHECK-NEXT:    %result_else = add i32 %mask_else, %mask_else
; CHECK-NEXT:    br label %merge
; CHECK:       merge:
; CHECK-NEXT:    %result = phi i32 [ %result_then, %then ], [ %result_else, %else ]
; CHECK-NEXT:    %final = add i32 %result, %entry_work
; CHECK-NEXT:    ret i32 %final
;
  ; Duplicate pair in the entry block: %mask1_dup is expected to be replaced
  ; by %mask1.
  %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %mask1_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %entry_work = add i32 %mask1, %mask1_dup
  br i1 %cond, label %then, label %else

then:
  ; Duplicate pair in %then: %mask_then_dup is expected to be replaced by
  ; %mask_then.
  %mask_then = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
  %mask_then_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
  %result_then = add i32 %mask_then, %mask_then_dup
  br label %merge

else:
  ; Duplicate pair in %else: %mask_else_dup is expected to be replaced by
  ; %mask_else.
  %mask_else = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
  %mask_else_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
  %result_else = add i32 %mask_else, %mask_else_dup
  br label %merge

merge:
  ; Combine the branch result with the entry-block sum so that every ballot
  ; value has a use reaching the return.
  %result = phi i32 [ %result_then, %then ], [ %result_else, %else ]
  %final = add i32 %result, %entry_work
  ret i32 %final
}

; Test complex control flow
;
; Two-level branching: the entry block branches on %cond1 to %branch1 or
; %branch2, and %branch1 branches on %cond2 to %nested1 or %nested2. The
; entry, %nested1, %nested2 and %branch2 blocks each hold a pair of identical
; WaveBallot calls; %branch1 holds none. The expected output below keeps one
; call per block and rewrites each add to use the surviving value twice.
define i32 @test_complex_control_flow(i1 %cond1, i1 %cond2) {
; CHECK-LABEL: @test_complex_control_flow
; CHECK-NEXT:    %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
; CHECK-NEXT:    %entry_result = add i32 %mask1, %mask1
; CHECK-NEXT:    br i1 %cond1, label %branch1, label %branch2
; CHECK:       branch1:
; CHECK-NEXT:    br i1 %cond2, label %nested1, label %nested2
; CHECK:       nested1:
; CHECK-NEXT:    %mask_n1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
; CHECK-NEXT:    %n1_result = add i32 %mask_n1, %mask_n1
; CHECK-NEXT:    br label %merge
; CHECK:       nested2:
; CHECK-NEXT:    %mask_n2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 1)
; CHECK-NEXT:    %n2_result = add i32 %mask_n2, %mask_n2
; CHECK-NEXT:    br label %merge
; CHECK:       branch2:
; CHECK-NEXT:    %mask_b2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
; CHECK-NEXT:    %b2_result = add i32 %mask_b2, %mask_b2
; CHECK-NEXT:    br label %merge
; CHECK:       merge:
; CHECK-NEXT:    %result = phi i32 [ %n1_result, %nested1 ], [ %n2_result, %nested2 ], [ %b2_result, %branch2 ]
; CHECK-NEXT:    %final = add i32 %result, %entry_result
; CHECK-NEXT:    ret i32 %final
;
  ; Duplicate pair in the entry block.
  %mask1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %mask1_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 0)
  %entry_result = add i32 %mask1, %mask1_dup
  br i1 %cond1, label %branch1, label %branch2

branch1:
  ; Pure dispatch block: no ballot here, only the second-level branch.
  br i1 %cond2, label %nested1, label %nested2

nested1:
  ; Duplicate pair with operands (false, 1).
  %mask_n1 = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
  %mask_n1_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 false, i32 1)
  %n1_result = add i32 %mask_n1, %mask_n1_dup
  br label %merge

nested2:
  ; Duplicate pair with operands (true, 1); differs from %nested1 only in the
  ; i1 operand.
  %mask_n2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 1)
  %mask_n2_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 1)
  %n2_result = add i32 %mask_n2, %mask_n2_dup
  br label %merge

branch2:
  ; Duplicate pair with operands (true, 2).
  %mask_b2 = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
  %mask_b2_dup = call i32 @llvm.genx.GenISA.WaveBallot(i1 true, i32 2)
  %b2_result = add i32 %mask_b2, %mask_b2_dup
  br label %merge

merge:
  ; Three-way join of the leaf blocks, then fold in the entry-block sum.
  %result = phi i32 [ %n1_result, %nested1 ], [ %n2_result, %nested2 ], [ %b2_result, %branch2 ]
  %final = add i32 %result, %entry_result
  ret i32 %final
}

; Declaration of the intrinsic called by every test function in this file:
; takes an i1 and an i32 operand and returns an i32.
; NOTE(review): declared here without any function attributes; the first test
; attributes the no-cross-block behaviour to the call being convergent --
; confirm how the pass identifies that property.
declare i32 @llvm.genx.GenISA.WaveBallot(i1, i32)