File: cast_to_bfloat.ll

package info (click to toggle)
intel-graphics-compiler2 2.28.4-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 792,744 kB
  • sloc: cpp: 5,761,745; ansic: 466,928; lisp: 312,143; python: 114,790; asm: 44,736; pascal: 10,930; sh: 8,033; perl: 7,914; ml: 3,625; awk: 3,523; yacc: 2,747; javascript: 2,667; lex: 1,898; f90: 1,028; cs: 573; xml: 474; makefile: 344; objc: 162
file content (50 lines) | stat: -rw-r--r-- 2,996 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; REQUIRES: llvm-14-plus
;
; RUN: igc_opt --opaque-pointers --igc-bfloat-builtins-resolution -S 2>&1 < %s | FileCheck %s --dump-input-filter all

target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024-n8:16:32"
target triple = "spir64-unknown-unknown"

declare spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32)

; CHECK-LABEL: define spir_kernel void @test_cast_to_v2bfloat
declare spir_func <2 x bfloat> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8>)
define spir_kernel void @test_cast_to_v2bfloat(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf) {
entry:
  %globalId = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
  %loadIdx = getelementptr inbounds <2 x i8>, ptr addrspace(1) %inbuf, i64 %globalId
  %loaded = load <2 x i8>, ptr addrspace(1) %loadIdx, align 2
  %call1 = call spir_func <2 x bfloat> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8> %loaded)
  ; CHECK: %[[OUTPUT:[A-z0-9]*]] = call <2 x i16> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8> %loaded)
  ; CHECK: %[[OUTPUT_CASTED:[A-z0-9]*]] = bitcast <2 x i16> %[[OUTPUT]] to <2 x bfloat>
  %storeIdx = getelementptr inbounds <2 x bfloat>, ptr addrspace(1) %outbuf, i64 %globalId
  store <2 x bfloat> %call1, ptr addrspace(1) %storeIdx, align 4
  ret void
}

; CHECK-LABEL: define spir_kernel void @test_cast_to_bfloat
declare spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8)
define spir_kernel void @test_cast_to_bfloat(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf) {
entry:
  %globalId = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
  %loadIdx = getelementptr inbounds i8, ptr addrspace(1) %inbuf, i64 %globalId
  %loaded = load i8, ptr addrspace(1) %loadIdx, align 2
  %call1 = call spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
  %call2 = call spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
  ; CHECK: %[[OUTPUT1:[A-z0-9]*]] = call i16 @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
  ; CHECK: %[[OUTPUT1_CASTED:[A-z0-9]*]] = bitcast i16 %[[OUTPUT1]] to bfloat
  ; CHECK: %[[OUTPUT2:[A-z0-9]*]] = call i16 @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
  ; CHECK: %[[OUTPUT2_CASTED:[A-z0-9]*]] = bitcast i16 %[[OUTPUT2]] to bfloat
  %storeIdx1 = getelementptr inbounds bfloat, ptr addrspace(1) %outbuf, i64 %globalId
  %storeIdx2 = getelementptr inbounds bfloat, ptr addrspace(1) %storeIdx1, i64 1024
  store bfloat %call1, ptr addrspace(1) %storeIdx1, align 4
  store bfloat %call2, ptr addrspace(1) %storeIdx2, align 4
  ret void
}