File: ldrawvec.ll

package info (click to toggle)
intel-graphics-compiler2 2.28.4-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 792,744 kB
  • sloc: cpp: 5,761,745; ansic: 466,928; lisp: 312,143; python: 114,790; asm: 44,736; pascal: 10,930; sh: 8,033; perl: 7,914; ml: 3,625; awk: 3,523; yacc: 2,747; javascript: 2,667; lex: 1,898; f90: 1,028; cs: 573; xml: 474; makefile: 344; objc: 162
file content (37 lines) | stat: -rw-r--r-- 1,551 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
;
; REQUIRES: llvm-14-plus
; RUN: igc_opt --opaque-pointers -igc-custom-safe-opt -dce -S < %s | FileCheck %s
; ------------------------------------------------
; CustomSafeOptPass: ldrawvector
; ------------------------------------------------

; Test checks that a sequence of ldrawvector + extractelement is replaced with
; GenISA.ldraw.indexed when possible

define float @test_loadvec(ptr addrspace(1) %src, i32 %offset) {
; CHECK-LABEL: define float @test_loadvec(
; CHECK-SAME: ptr addrspace(1) [[SRC:%.*]], i32 [[OFFSET:%.*]]) {
; CHECK:    [[TMP1:%.*]] = add i32 [[OFFSET]], 12
; CHECK:    [[TMP2:%.*]] = call float @llvm.genx.GenISA.ldraw.indexed.f32.p1(ptr addrspace(1) [[SRC]], i32 [[TMP1]], i32 4, i1 true)
; CHECK:    ret float [[TMP2]]
;
  ; Input pattern: a four-float vector load of which only lane 3 is used.
  ; The expected output above is a scalar load at %offset + 12 that keeps
  ; the same alignment (4) and volatile flag (true) operands.
  %vec = call <4 x float> @llvm.genx.GenISA.ldrawvector.indexed.p1(ptr addrspace(1) %src, i32 %offset, i32 4, i1 true)
  %lane3 = extractelement <4 x float> %vec, i32 3
  ret float %lane3
}

; Function Desc: Read a vector from a buffer pointer at byte offset
; Output: the loaded vector (<4 x float> for this declaration)
; Arg 0: buffer pointer, result of GetBufferPtr
; Arg 1: offset from the base pointer, in bytes
; Arg 2: alignment in bytes
; Arg 3: volatile, must be an immediate
; Function Attrs: argmemonly nounwind readonly
declare <4 x float> @llvm.genx.GenISA.ldrawvector.indexed.p1(ptr addrspace(1), i32, i32, i1)