1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
|
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2022 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; RUN: igc_opt %s -S -o - -igc-generic-address-dynamic-resolution | FileCheck %s
; This test verifies whether optimization which allows to avoid additional control flow
; generation is blocked when a kernel calls a function indirectly. In such case, we don't
; know what function is going to be called by a function pointer, so it is not possible
; to check whether callee contains addrspacecast's from private/local to generic addrspace.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024"
declare spir_func void @foo(i32 addrspace(4)* %ptr) "referenced-indirectly"
define spir_kernel void @kernel(i32 addrspace(1)* %global_buffer) {
%fp = alloca void (i32 addrspace(4)*)*, align 8
store void (i32 addrspace(4)*)* @foo, void (i32 addrspace(4)*)** %fp, align 8
%generic_ptr = addrspacecast i32 addrspace(1)* %global_buffer to i32 addrspace(4)*
%f = load void (i32 addrspace(4)*)*, void (i32 addrspace(4)*)** %fp, align 8
call spir_func void %f(i32 addrspace(4)* %generic_ptr)
; CHECK: %[[PTI:.*]] = ptrtoint i32 addrspace(4)* %generic_ptr to i64
; CHECK: %[[TAG:.*]] = lshr i64 %[[PTI]], 61
; CHECK: switch i64 %[[TAG]], label %GlobalBlock [
; CHECK: i64 2, label %LocalBlock
; CHECK: ]
; CHECK: LocalBlock:
; CHECK: %[[LOCAL_PTR:.*]] = addrspacecast i32 addrspace(4)* %generic_ptr to i32 addrspace(3)*
; CHECK: store i32 5, i32 addrspace(3)* %[[LOCAL_PTR]], align 4
; CHECK: GlobalBlock:
; CHECK: %[[GLOBAL_PTR:.*]] = addrspacecast i32 addrspace(4)* %generic_ptr to i32 addrspace(1)*
; CHECK: store i32 5, i32 addrspace(1)* %[[GLOBAL_PTR]], align 4
store i32 5, i32 addrspace(4)* %generic_ptr, align 4
ret void
}
|