1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118
|
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2023 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================
; RUN: %opt %use_old_pass_manager% -GenXGEPLowering -march=genx64 -mcpu=Gen9 -S < %s | FileCheck %s
target datalayout = "e-p:64:64-p3:32:32-i64:64-n8:16:32:64"
declare <32 x double> @llvm.vc.internal.lsc.load.slm.v32f64.v32i1.v32i32(<32 x i1>, i8, i8, i8, i8, i8, i32, <32 x i32>, i16, i32, <32 x double>)
declare <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1>, i8, i8, i8, i8, i8, i64, i64, i16, i32, <32 x i32>)
declare <32 x double> @llvm.vc.internal.lsc.load.ugm.v32f64.v32i1.v32i64(<32 x i1>, i8, i8, i8, i8, i8, i64, <32 x i64>, i16, i32, <32 x double>)
; CHECK-LABEL: @test_fold_cast
define <32 x i32> @test_fold_cast(i8 addrspace(1)* align 8 %a) {
entry:
%bitcast = bitcast i8 addrspace(1)* %a to double addrspace(1)*
; CHECK: %pti = ptrtoint i8 addrspace(1)* %a to i64
%pti = ptrtoint double addrspace(1)* %bitcast to i64
%res = call <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1> <i1 true>, i8 3, i8 3, i8 7, i8 0, i8 0, i64 0, i64 %pti, i16 1, i32 0, <32 x i32> undef)
ret <32 x i32> %res
}
; CHECK-LABEL: @test_fold_itp
define <32 x i32> @test_fold_itp(i64 %a) {
entry:
%itp = inttoptr i64 %a to double addrspace(1)*
%pti = ptrtoint double addrspace(1)* %itp to i64
; CHECK: %res = call <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1> <i1 true>, i8 3, i8 3, i8 7, i8 0, i8 0, i64 0, i64 %a, i16 1, i32 0, <32 x i32> undef)
%res = call <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1> <i1 true>, i8 3, i8 3, i8 7, i8 0, i8 0, i64 0, i64 %pti, i16 1, i32 0, <32 x i32> undef)
ret <32 x i32> %res
}
; CHECK-LABEL: @test_fold_cast_gep_pti
define <32 x i32> @test_fold_cast_gep_pti(i8 addrspace(1)* align 8 %a) {
entry:
%bitcast = bitcast i8 addrspace(1)* %a to double addrspace(1)*
; CHECK: [[PTI:%[^ ]+]] = ptrtoint i8 addrspace(1)* %a to i64
; CHECK: [[ADD:%[^ ]+]] = add i64 [[PTI]], 1024
%gep = getelementptr double, double addrspace(1)* %bitcast, i32 128
%pti = ptrtoint double addrspace(1)* %gep to i64
; CHECL: %res = call <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1> <i1 true>, i8 3, i8 3, i8 7, i8 0, i8 0, i64 0, i64 [[ADD]], i16 1, i32 0, <32 x i32> undef)
%res = call <32 x i32> @llvm.vc.internal.lsc.load.ugm.v32i32.v1i1.i64(<1 x i1> <i1 true>, i8 3, i8 3, i8 7, i8 0, i8 0, i64 0, i64 %pti, i16 1, i32 0, <32 x i32> undef)
ret <32 x i32> %res
}
; CHECK-LABEL: @test_fold_ascastp42p3_vector
define <32 x double> @test_fold_ascastp42p3_vector(<32 x i1> %mask, <32 x double addrspace(4)*> %a) {
entry:
%ascast = addrspacecast <32 x double addrspace(4)*> %a to <32 x double addrspace(3)*>
; CHECK: %pti = ptrtoint <32 x double addrspace(3)*> %ascast to <32 x i32>
%pti = ptrtoint <32 x double addrspace(3)*> %ascast to <32 x i32>
%res = call <32 x double> @llvm.vc.internal.lsc.load.slm.v32f64.v32i1.v32i32(<32 x i1> %mask, i8 2, i8 4, i8 1, i8 0, i8 0, i32 0, <32 x i32> %pti, i16 1, i32 0, <32 x double> undef)
ret <32 x double> %res
}
; CHECK-LABEL: @test_fold_ascastp42p1_vector
define <32 x double> @test_fold_ascastp42p1_vector(<32 x i1> %mask, <32 x double addrspace(4)*> %a) {
entry:
%ascast = addrspacecast <32 x double addrspace(4)*> %a to <32 x double addrspace(1)*>
; CHECK: %pti = ptrtoint <32 x double addrspace(4)*> %a to <32 x i64>
%pti = ptrtoint <32 x double addrspace(1)*> %ascast to <32 x i64>
%res = call <32 x double> @llvm.vc.internal.lsc.load.ugm.v32f64.v32i1.v32i64(<32 x i1> %mask, i8 3, i8 4, i8 1, i8 0, i8 0, i64 0, <32 x i64> %pti, i16 1, i32 0, <32 x double> undef)
ret <32 x double> %res
}
; CHECK-LABEL: @test_fold_cast_vector
define <32 x double> @test_fold_cast_vector(<32 x i1> %mask, <32 x i8 addrspace(1)*> %a) {
entry:
%bitcast = bitcast <32 x i8 addrspace(1)*> %a to <32 x double addrspace(1)*>
; CHECK: %pti = ptrtoint <32 x i8 addrspace(1)*> %a to <32 x i64>
%pti = ptrtoint <32 x double addrspace(1)*> %bitcast to <32 x i64>
%res = call <32 x double> @llvm.vc.internal.lsc.load.ugm.v32f64.v32i1.v32i64(<32 x i1> %mask, i8 3, i8 4, i8 1, i8 0, i8 0, i64 0, <32 x i64> %pti, i16 1, i32 0, <32 x double> undef)
ret <32 x double> %res
}
; CHECK-LABEL: @test_fold_itp_vector
define <32 x double> @test_fold_itp_vector(<32 x i1> %mask, <32 x i64> %a) {
entry:
%itp = inttoptr <32 x i64> %a to <32 x double addrspace(1)*>
%pti = ptrtoint <32 x double addrspace(1)*> %itp to <32 x i64>
; CHECK: %res = call <32 x double> @llvm.vc.internal.lsc.load.ugm.v32f64.v32i1.v32i64(<32 x i1> %mask, i8 3, i8 4, i8 1, i8 0, i8 0, i64 0, <32 x i64> %a, i16 1, i32 0, <32 x double> undef)
%res = call <32 x double> @llvm.vc.internal.lsc.load.ugm.v32f64.v32i1.v32i64(<32 x i1> %mask, i8 3, i8 4, i8 1, i8 0, i8 0, i64 0, <32 x i64> %pti, i16 1, i32 0, <32 x double> undef)
ret <32 x double> %res
}
; CHECK-LABEL: @test_cross_block
define void @test_cross_block(i64 %a, i32 %b) {
entry:
%itp = inttoptr i64 %a to float*
%mul = mul i32 %b, 60
%zext = zext i32 %mul to i64
; CHECK: [[SCALE:%[^ ]+]] = shl i64 %zext, 2
; CHECK: [[ADD:%[^ ]+]] = add i64 %a, [[SCALE]]
%gep = getelementptr inbounds float, float* %itp, i64 %zext
br label %label
label: ; preds = %entry
%pti = ptrtoint float* %gep to i64
; CHECK: %ins = insertelement <16 x i64> undef, i64 [[ADD]], i64 0
%ins = insertelement <16 x i64> undef, i64 %pti, i64 0
%splat = shufflevector <16 x i64> %ins, <16 x i64> undef, <16 x i32> zeroinitializer
ret void
}
; CHECK-LABEL: @test_bitcast_vector_to_scalar
define i64 @test_bitcast_vector_to_scalar(<1 x i8*> %vptr) {
%ptr = bitcast <1 x i8*> %vptr to i8*
%gep = getelementptr i8, i8* %ptr, i32 123
%addr = ptrtoint i8* %gep to i64
; CHECK: [[PTI:%[^ ]+]] = ptrtoint i8* %ptr to i64
; CHECK: [[ADD:%[^ ]+]] = add i64 [[PTI]], 123
; CHECK: ret i64 [[ADD]]
ret i64 %addr
}
|