1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50
|
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2024 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; REQUIRES: llvm-14-plus
;
; RUN: igc_opt --opaque-pointers --igc-bfloat-builtins-resolution -S 2>&1 < %s | FileCheck %s --dump-input-filter all
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024-n8:16:32"
target triple = "spir64-unknown-unknown"
declare spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32)
; CHECK-LABEL: define spir_kernel void @test_cast_to_v2bfloat
declare spir_func <2 x bfloat> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8>)
define spir_kernel void @test_cast_to_v2bfloat(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf) {
entry:
%globalId = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
%loadIdx = getelementptr inbounds <2 x i8>, ptr addrspace(1) %inbuf, i64 %globalId
%loaded = load <2 x i8>, ptr addrspace(1) %loadIdx, align 2
%call1 = call spir_func <2 x bfloat> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8> %loaded)
; CHECK: %[[OUTPUT:[A-z0-9]*]] = call <2 x i16> @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELDv2_c(<2 x i8> %loaded)
; CHECK: %[[OUTPUT_CASTED:[A-z0-9]*]] = bitcast <2 x i16> %[[OUTPUT]] to <2 x bfloat>
%storeIdx = getelementptr inbounds <2 x bfloat>, ptr addrspace(1) %outbuf, i64 %globalId
store <2 x bfloat> %call1, ptr addrspace(1) %storeIdx, align 4
ret void
}
; CHECK-LABEL: define spir_kernel void @test_cast_to_bfloat
declare spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8)
define spir_kernel void @test_cast_to_bfloat(ptr addrspace(1) %inbuf, ptr addrspace(1) %outbuf) {
entry:
%globalId = call spir_func i64 @_Z33__spirv_BuiltInGlobalInvocationIdi(i32 0)
%loadIdx = getelementptr inbounds i8, ptr addrspace(1) %inbuf, i64 %globalId
%loaded = load i8, ptr addrspace(1) %loadIdx, align 2
%call1 = call spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
%call2 = call spir_func bfloat @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
; CHECK: %[[OUTPUT1:[A-z0-9]*]] = call i16 @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
; CHECK: %[[OUTPUT1_CASTED:[A-z0-9]*]] = bitcast i16 %[[OUTPUT1]] to bfloat
; CHECK: %[[OUTPUT2:[A-z0-9]*]] = call i16 @_Z38__builtin_spirv_ConvertE5M2ToBF16INTELc(i8 %loaded)
; CHECK: %[[OUTPUT2_CASTED:[A-z0-9]*]] = bitcast i16 %[[OUTPUT2]] to bfloat
%storeIdx1 = getelementptr inbounds bfloat, ptr addrspace(1) %outbuf, i64 %globalId
%storeIdx2 = getelementptr inbounds bfloat, ptr addrspace(1) %storeIdx1, i64 1024
store bfloat %call1, ptr addrspace(1) %storeIdx1, align 4
store bfloat %call2, ptr addrspace(1) %storeIdx2, align 4
ret void
}
|