File: basic.ll

package info (click to toggle)
intel-graphics-compiler 1.0.17791.18-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 102,312 kB
  • sloc: cpp: 935,343; lisp: 286,143; ansic: 16,196; python: 3,279; yacc: 2,487; lex: 1,642; pascal: 300; sh: 174; makefile: 27
file content (114 lines) | stat: -rw-r--r-- 5,730 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2022 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
;
; RUN: igc_opt -enable-debugify -igc-agg-arg -S < %s 2>&1 | FileCheck %s
; ------------------------------------------------
; ResolveAggregateArguments
; ------------------------------------------------

; Debug-info related check
;
; CHECK-NOT: WARNING
; CHECK: CheckModuleDebugify: PASS

target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024-n8:16:32"

%struct._st_foo = type { i32, <4 x float>, [2 x i64] }

; Function Attrs: convergent noinline nounwind optnone
define spir_kernel void @bar(%struct._st_foo* byval(%struct._st_foo) %src, <8 x i32> %r0, <8 x i32> %payloadHeader, i8* %privateBase, i32 %const_reg_dword, float %const_reg_fp32, float %const_reg_fp321, float %const_reg_fp322, float %const_reg_fp323, i64 %const_reg_qword, i64 %const_reg_qword4) #0 {
; CHECK-LABEL: @bar(
; CHECK-NEXT:  entry:
; CHECK:    [[SRC_ALLOCA:%.*]] = alloca [[STRUCT__ST_FOO:%[A-z0-9_.]*]]
; CHECK:    [[TMP0:%[A-z0-9]*]] = bitcast %struct._st_foo* [[SRC_ALLOCA]] to i8*
; CHECK:    [[TMP1:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 0
; CHECK:    [[TMP2:%[A-z0-9]*]] = bitcast i8* [[TMP1]] to i32*
; CHECK:    store i32 [[CONST_REG_DWORD:%[A-z0-9]*]], i32* [[TMP2]]
; CHECK:    [[TMP3:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 16
; CHECK:    [[TMP4:%[A-z0-9]*]] = bitcast i8* [[TMP3]] to float*
; CHECK:    store float [[CONST_REG_FP32:%[A-z0-9]*]], float* [[TMP4]]
; CHECK:    [[TMP5:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 20
; CHECK:    [[TMP6:%[A-z0-9]*]] = bitcast i8* [[TMP5]] to float*
; CHECK:    store float [[CONST_REG_FP321:%[A-z0-9]*]], float* [[TMP6]]
; CHECK:    [[TMP7:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 24
; CHECK:    [[TMP8:%[A-z0-9]*]] = bitcast i8* [[TMP7]] to float*
; CHECK:    store float [[CONST_REG_FP322:%[A-z0-9]*]], float* [[TMP8]]
; CHECK:    [[TMP9:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 28
; CHECK:    [[TMP10:%[A-z0-9]*]] = bitcast i8* [[TMP9]] to float*
; CHECK:    store float [[CONST_REG_FP323:%[A-z0-9]*]], float* [[TMP10]]
; CHECK:    [[TMP11:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 32
; CHECK:    [[TMP12:%[A-z0-9]*]] = bitcast i8* [[TMP11]] to i64*
; CHECK:    store i64 [[CONST_REG_QWORD:%[A-z0-9]*]], i64* [[TMP12]]
; CHECK:    [[TMP13:%[A-z0-9]*]] = getelementptr i8, i8* [[TMP0]], i32 40
; CHECK:    [[TMP14:%[A-z0-9]*]] = bitcast i8* [[TMP13]] to i64*
; CHECK:    store i64 [[CONST_REG_QWORD4:%[A-z0-9]*]], i64* [[TMP14]]
; CHECK:    [[AA:%[A-z0-9]*]] = alloca i32, align 4
; CHECK:    [[BB:%[A-z0-9]*]] = alloca i32, align 4
; CHECK:    [[CC:%[A-z0-9]*]] = alloca i32, align 4
; CHECK:    [[A:%[A-z0-9]*]] = getelementptr inbounds [[STRUCT__ST_FOO]], %struct._st_foo* [[SRC_ALLOCA]], i32 0, i32 0
; CHECK:    [[TMP15:%[A-z0-9]*]] = load i32, i32* [[A]], align 16
; CHECK:    store i32 [[TMP15]], i32* [[AA]], align 4
; CHECK:    [[B:%[A-z0-9]*]] = getelementptr inbounds [[STRUCT__ST_FOO]], %struct._st_foo* [[SRC_ALLOCA]], i32 0, i32 1
; CHECK:    [[TMP16:%[A-z0-9]*]] = load <4 x float>, <4 x float>* [[B]], align 16
; CHECK:    [[TMP17:%[A-z0-9]*]] = extractelement <4 x float> [[TMP16]], i32 1
; CHECK:    [[CONV_I:%[A-z0-9.]*]] = fptosi float [[TMP17]] to i32
; CHECK:    store i32 [[CONV_I]], i32* [[BB]], align 4
; CHECK:    [[C:%[A-z0-9]*]] = getelementptr inbounds [[STRUCT__ST_FOO]], %struct._st_foo* [[SRC_ALLOCA]], i32 0, i32 2
; CHECK:    [[ARRAYIDX:%[A-z0-9]*]] = getelementptr inbounds [2 x i64], [2 x i64]* [[C]], i64 0, i64 1
; CHECK:    [[TMP18:%[A-z0-9]*]] = load i64, i64* [[ARRAYIDX]], align 8
; CHECK:    [[CONV_I1:%[A-z0-9.]*]] = trunc i64 [[TMP18]] to i32
; CHECK:    store i32 [[CONV_I1]], i32* [[CC]], align 4
; CHECK:    ret void
;
entry:
  %aa = alloca i32, align 4
  %bb = alloca i32, align 4
  %cc = alloca i32, align 4
  %a = getelementptr inbounds %struct._st_foo, %struct._st_foo* %src, i32 0, i32 0
  %0 = load i32, i32* %a, align 16
  store i32 %0, i32* %aa, align 4
  %b = getelementptr inbounds %struct._st_foo, %struct._st_foo* %src, i32 0, i32 1
  %1 = load <4 x float>, <4 x float>* %b, align 16
  %2 = extractelement <4 x float> %1, i32 1
  %conv.i = fptosi float %2 to i32
  store i32 %conv.i, i32* %bb, align 4
  %c = getelementptr inbounds %struct._st_foo, %struct._st_foo* %src, i32 0, i32 2
  %arrayidx = getelementptr inbounds [2 x i64], [2 x i64]* %c, i64 0, i64 1
  %3 = load i64, i64* %arrayidx, align 8
  %conv.i1 = trunc i64 %3 to i32
  store i32 %conv.i1, i32* %cc, align 4
  ret void
}

attributes #0 = { convergent noinline nounwind optnone }
attributes #2 = { nounwind }

!igc.functions = !{!3}

!3 = !{void (%struct._st_foo*, <8 x i32>, <8 x i32>, i8*, i32, float, float, float, float, i64, i64)* @bar, !4}
!4 = !{!5, !6}
!5 = !{!"function_type", i32 0}
!6 = !{!"implicit_arg_desc", !7, !8, !9, !10, !13, !15, !17, !19, !21, !23}
!7 = !{i32 0}
!8 = !{i32 1}
!9 = !{i32 12}
!10 = !{i32 17, !11, !12}
!11 = !{!"explicit_arg_num", i32 0}
!12 = !{!"struct_arg_offset", i32 0}
!13 = !{i32 15, !11, !14}
!14 = !{!"struct_arg_offset", i32 16}
!15 = !{i32 15, !11, !16}
!16 = !{!"struct_arg_offset", i32 20}
!17 = !{i32 15, !11, !18}
!18 = !{!"struct_arg_offset", i32 24}
!19 = !{i32 15, !11, !20}
!20 = !{!"struct_arg_offset", i32 28}
!21 = !{i32 16, !11, !22}
!22 = !{!"struct_arg_offset", i32 32}
!23 = !{i32 16, !11, !24}
!24 = !{!"struct_arg_offset", i32 40}