1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu -slp-threshold=-100 < %s | FileCheck %s
; Input for the SLP vectorizer: an i16 'and' reduction chain that combines %1
; with eight byte-swapped values. The swapped values come from five udivs with
; identical operands, and three of the truncated results (%4, %6, %7) are each
; byte-swapped twice. The expected output below keeps the first udiv/trunc
; scalar, performs the other four udivs as one <4 x i64> udiv, and reduces a
; single <8 x i16> bswap with llvm.vector.reduce.and before and-ing in %1.
define i8 @test(ptr %g_127, i32 %0, i16 %1) {
; CHECK-LABEL: define i8 @test(
; CHECK-SAME: ptr [[G_127:%.*]], i32 [[TMP0:%.*]], i16 [[TMP1:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[FOR_INC434_I:.*]]
; CHECK: [[FOR_COND166_PREHEADER_I:.*]]:
; CHECK-NEXT: br label %[[FOR_INC434_I]]
; CHECK: [[FOR_INC434_I]]:
; CHECK-NEXT: [[TMP2:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ 60, %[[FOR_COND166_PREHEADER_I]] ]
; CHECK-NEXT: [[CONV8_I_I:%.*]] = zext nneg i32 [[TMP0]] to i64
; CHECK-NEXT: [[DIV_I_I_1:%.*]] = udiv i64 [[CONV8_I_I]], [[TMP2]]
; CHECK-NEXT: [[TMP3:%.*]] = trunc i64 [[DIV_I_I_1]] to i16
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <8 x i16> poison, i16 [[TMP3]], i32 0
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <4 x i64> poison, i64 [[CONV8_I_I]], i32 0
; CHECK-NEXT: [[TMP6:%.*]] = shufflevector <4 x i64> [[TMP5]], <4 x i64> poison, <4 x i32> zeroinitializer
; CHECK-NEXT: [[TMP7:%.*]] = insertelement <4 x i64> poison, i64 [[TMP2]], i32 0
; CHECK-NEXT: [[TMP8:%.*]] = shufflevector <4 x i64> [[TMP7]], <4 x i64> poison, <4 x i32> zeroinitializer
; CHECK-NEXT: [[TMP9:%.*]] = udiv <4 x i64> [[TMP6]], [[TMP8]]
; CHECK-NEXT: [[TMP10:%.*]] = trunc <4 x i64> [[TMP9]] to <4 x i16>
; CHECK-NEXT: [[TMP11:%.*]] = shufflevector <4 x i16> [[TMP10]], <4 x i16> poison, <8 x i32> <i32 0, i32 poison, i32 1, i32 2, i32 poison, i32 3, i32 poison, i32 poison>
; CHECK-NEXT: [[TMP12:%.*]] = shufflevector <8 x i16> [[TMP4]], <8 x i16> [[TMP11]], <8 x i32> <i32 0, i32 8, i32 poison, i32 10, i32 11, i32 poison, i32 13, i32 poison>
; CHECK-NEXT: [[TMP13:%.*]] = shufflevector <8 x i16> [[TMP12]], <8 x i16> poison, <8 x i32> <i32 0, i32 1, i32 1, i32 3, i32 4, i32 4, i32 6, i32 6>
; CHECK-NEXT: [[TMP14:%.*]] = call <8 x i16> @llvm.bswap.v8i16(<8 x i16> [[TMP13]])
; CHECK-NEXT: [[TMP15:%.*]] = call i16 @llvm.vector.reduce.and.v8i16(<8 x i16> [[TMP14]])
; CHECK-NEXT: [[OP_RDX:%.*]] = and i16 [[TMP15]], [[TMP1]]
; CHECK-NEXT: [[AND14_I_2_I_5:%.*]] = zext i16 [[OP_RDX]] to i32
; CHECK-NEXT: store i32 [[AND14_I_2_I_5]], ptr [[G_127]], align 4
; CHECK-NEXT: ret i8 0
;
entry:
br label %for.inc434.i
; No branch in this function targets the following block; it only supplies the
; second incoming edge (value 60) of the phi in %for.inc434.i.
for.cond166.preheader.i:
br label %for.inc434.i
for.inc434.i:
; Divisor shared by every udiv below: 0 on the %entry edge, 60 on the other.
%2 = phi i64 [ 0, %entry ], [ 60, %for.cond166.preheader.i ]
; Dividend shared by every udiv below.
%conv8.i.i = zext nneg i32 %0 to i64
; Quotient 1: truncated to %3 and byte-swapped once. The chain starts at %1.
%div.i.i.1 = udiv i64 %conv8.i.i, %2
%3 = trunc i64 %div.i.i.1 to i16
%call12.i.2.i.1 = tail call i16 @llvm.bswap.i16(i16 %3)
%and14.i.2.i.118 = and i16 %1, %call12.i.2.i.1
; Quotient 2: truncated to %4 and byte-swapped twice; both results join the chain.
%div.i.i.2 = udiv i64 %conv8.i.i, %2
%4 = trunc i64 %div.i.i.2 to i16
%call12.i.i.2 = tail call i16 @llvm.bswap.i16(i16 %4)
%and14.i.i.219 = and i16 %and14.i.2.i.118, %call12.i.i.2
%call12.i.2.i.2 = tail call i16 @llvm.bswap.i16(i16 %4)
%and14.i.2.i.220 = and i16 %and14.i.i.219, %call12.i.2.i.2
; Quotient 3: truncated to %5 and byte-swapped once.
%div.i.i.3 = udiv i64 %conv8.i.i, %2
%5 = trunc i64 %div.i.i.3 to i16
%call12.i.2.i.3 = tail call i16 @llvm.bswap.i16(i16 %5)
%and14.i.2.i.322 = and i16 %and14.i.2.i.220, %call12.i.2.i.3
; Quotient 4: truncated to %6 and byte-swapped twice.
%div.i.i.4 = udiv i64 %conv8.i.i, %2
%6 = trunc i64 %div.i.i.4 to i16
%call12.i.i.4 = tail call i16 @llvm.bswap.i16(i16 %6)
%and14.i.i.423 = and i16 %and14.i.2.i.322, %call12.i.i.4
%call12.i.2.i.4 = tail call i16 @llvm.bswap.i16(i16 %6)
%and14.i.2.i.424 = and i16 %and14.i.i.423, %call12.i.2.i.4
; Quotient 5: truncated to %7 and byte-swapped twice; ends the 'and' chain.
%div.i.i.5 = udiv i64 %conv8.i.i, %2
%7 = trunc i64 %div.i.i.5 to i16
%call12.i.i.5 = tail call i16 @llvm.bswap.i16(i16 %7)
%and14.i.i.525 = and i16 %and14.i.2.i.424, %call12.i.i.5
%call12.i.2.i.5 = tail call i16 @llvm.bswap.i16(i16 %7)
%and14.i.2.i.51 = and i16 %and14.i.i.525, %call12.i.2.i.5
; Zero-extend the reduced i16 to i32 and store it through %g_127; the function
; itself always returns the constant 0.
%and14.i.2.i.5 = zext i16 %and14.i.2.i.51 to i32
store i32 %and14.i.2.i.5, ptr %g_127, align 4
ret i8 0
}
|