File: cast_to_i16.ll

package info (click to toggle)
intel-graphics-compiler2 2.28.4-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 792,744 kB
  • sloc: cpp: 5,761,745; ansic: 466,928; lisp: 312,143; python: 114,790; asm: 44,736; pascal: 10,930; sh: 8,033; perl: 7,914; ml: 3,625; awk: 3,523; yacc: 2,747; javascript: 2,667; lex: 1,898; f90: 1,028; cs: 573; xml: 474; makefile: 344; objc: 162
file content (69 lines) | stat: -rw-r--r-- 4,991 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; REQUIRES: llvm-14-plus
;
; RUN: igc_opt --opaque-pointers --igc-bfloat-builtins-resolution -S 2>&1 < %s | FileCheck %s --dump-input-filter all

; Module-level target description shared by every kernel in this file.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024-n8:16:32"
target triple = "spir64-unknown-unknown"

; Helper called by each kernel below with i32 0; the returned i64 is used as
; the element index into the kernel's input, seed and output buffers.
declare spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32)

; Scalar case with a seed-output pointer in addrspace(1).
; The kernel calls the builtin that takes (bfloat, i32, ptr addrspace(1)).
; The directives in the body expect the pass output to bitcast the bfloat
; operand to i16 and to call the variant whose mangled name has `DF16b`
; replaced by `s`, with the seed and pointer operands passed through unchanged.
; CHECK-LABEL: define spir_kernel void @test_cast_to_i16_with_pointer
declare spir_func signext i8 @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDF16biPU3AS1i(bfloat, i32, ptr addrspace(1))
define spir_kernel void @test_cast_to_i16_with_pointer(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf, ptr addrspace(1) %inseed, ptr addrspace(1) %outseed) {
entry:
  %globalId0 = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
  ; Per-work-item input element and seed.
  %inputAddr = getelementptr inbounds bfloat, ptr addrspace(1) %inbuf, i64 %globalId0
  %inputLoaded = load bfloat, ptr addrspace(1) %inputAddr, align 2
  %inSeedAddr = getelementptr inbounds i32, ptr addrspace(1) %inseed, i64 %globalId0
  %seedLoaded = load i32, ptr addrspace(1) %inSeedAddr, align 4
  %outSeedAddr = getelementptr inbounds i32, ptr addrspace(1) %outseed, i64 %globalId0
  ; Value names are captured with [A-Za-z0-9_.]+ so that numbered, underscored
  ; or dotted names are accepted while an empty name is rejected.
  ; CHECK: %[[INPUT_CASTED:[A-Za-z0-9_.]+]] = bitcast bfloat %inputLoaded to i16
  ; CHECK: %[[OUTPUT:[A-Za-z0-9_.]+]] = call i8 @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELsiPU3AS1i(i16 %[[INPUT_CASTED]], i32 %seedLoaded, ptr addrspace(1) %outSeedAddr)
  %result = call spir_func signext i8 @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDF16biPU3AS1i(bfloat %inputLoaded, i32 %seedLoaded, ptr addrspace(1) %outSeedAddr)
  %outputAddr = getelementptr inbounds i8, ptr addrspace(1) %outbuf, i64 %globalId0
  store i8 %result, ptr addrspace(1) %outputAddr, align 1
  ret void
}

; Two-element vector case with a seed-output pointer in addrspace(4).
; The kernel addrspacecasts %outseed from addrspace(1) to addrspace(4) and
; calls the builtin that takes (<2 x bfloat>, i32, ptr addrspace(4)).
; The directives in the body expect the pass output to bitcast the operand to
; <2 x i16> and to call the variant whose mangled name has `DF16b` replaced by
; `s`, with the seed and pointer operands passed through unchanged.
; CHECK-LABEL: define spir_kernel void @test_cast_to_v2i16_with_pointer
declare spir_func <2 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv2_DF16biPU3AS4i(<2 x bfloat>, i32, ptr addrspace(4))
define spir_kernel void @test_cast_to_v2i16_with_pointer(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf, ptr addrspace(1) %inseed, ptr addrspace(1) %outseed) {
entry:
  %globalId0 = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
  ; Per-work-item input vector and seed.
  %inputAddr = getelementptr inbounds <2 x bfloat>, ptr addrspace(1) %inbuf, i64 %globalId0
  %inputLoaded = load <2 x bfloat>, ptr addrspace(1) %inputAddr, align 4
  %inSeedAddr = getelementptr inbounds i32, ptr addrspace(1) %inseed, i64 %globalId0
  %seedLoaded = load i32, ptr addrspace(1) %inSeedAddr, align 4
  ; The builtin under test takes its seed-output pointer in addrspace(4).
  %outseedAddrspaceCast = addrspacecast ptr addrspace(1) %outseed to ptr addrspace(4)
  %outSeedAddr = getelementptr inbounds i32, ptr addrspace(4) %outseedAddrspaceCast, i64 %globalId0
  ; Value names are captured with [A-Za-z0-9_.]+ so that numbered, underscored
  ; or dotted names are accepted while an empty name is rejected.
  ; CHECK: %[[INPUT_CASTED:[A-Za-z0-9_.]+]] = bitcast <2 x bfloat> %inputLoaded to <2 x i16>
  ; CHECK: %[[OUTPUT:[A-Za-z0-9_.]+]] = call <2 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv2_siPU3AS4i(<2 x i16> %[[INPUT_CASTED]], i32 %seedLoaded, ptr addrspace(4) %outSeedAddr)
  %result = call spir_func <2 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv2_DF16biPU3AS4i(<2 x bfloat> %inputLoaded, i32 %seedLoaded, ptr addrspace(4) %outSeedAddr)
  %outputAddr = getelementptr inbounds <2 x i8>, ptr addrspace(1) %outbuf, i64 %globalId0
  store <2 x i8> %result, ptr addrspace(1) %outputAddr, align 2
  ret void
}

; Four-element vector case without a seed-output pointer.
; The kernel calls the builtin that takes only (<4 x bfloat>, i32).
; The directives in the body expect the pass output to bitcast the operand to
; <4 x i16> and to call the variant whose mangled name has `DF16b` replaced by
; `s`, with the seed operand passed through unchanged.
; CHECK-LABEL: define spir_kernel void @test_cast_to_v4i16_no_pointer
declare spir_func <4 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv4_DF16bi(<4 x bfloat>, i32)
define spir_kernel void @test_cast_to_v4i16_no_pointer(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf, ptr addrspace(1) %inseed) {
entry:
  %globalId0 = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
  ; Per-work-item input vector and seed.
  %inputAddr = getelementptr inbounds <4 x bfloat>, ptr addrspace(1) %inbuf, i64 %globalId0
  %inputLoaded = load <4 x bfloat>, ptr addrspace(1) %inputAddr, align 8
  %inSeedAddr = getelementptr inbounds i32, ptr addrspace(1) %inseed, i64 %globalId0
  %seedLoaded = load i32, ptr addrspace(1) %inSeedAddr, align 4
  ; Value names are captured with [A-Za-z0-9_.]+ so that numbered, underscored
  ; or dotted names are accepted while an empty name is rejected.
  ; CHECK: %[[INPUT_CASTED:[A-Za-z0-9_.]+]] = bitcast <4 x bfloat> %inputLoaded to <4 x i16>
  ; CHECK: %[[OUTPUT:[A-Za-z0-9_.]+]] = call <4 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv4_si(<4 x i16> %[[INPUT_CASTED]], i32 %seedLoaded)
  %result = call spir_func <4 x i8> @_Z46__builtin_spirv_StochasticRoundBF16ToE5M2INTELDv4_DF16bi(<4 x bfloat> %inputLoaded, i32 %seedLoaded)
  %outputAddr = getelementptr inbounds <4 x i8>, ptr addrspace(1) %outbuf, i64 %globalId0
  store <4 x i8> %result, ptr addrspace(1) %outputAddr, align 4
  ret void
}