; Codegen test for the llvm.experimental.cttz.elts intrinsic on x86-64; llc output is verified with FileCheck.
; RUN: llc -mtriple=x86_64-unknown-unknown < %s | FileCheck %s
; ctz_v8i16: calls llvm.experimental.cttz.elts on an <8 x i16> argument with
; the trailing i1 flag set to 0 and returns the i8 result.
;
; The expectations inside the function pin the x86-64 assembly llc must print:
;   1. a constant-pool entry holding the descending bytes 8, 7, ..., 1;
;   2. pcmpeqw against a zeroed register marks the zero lanes, packsswb
;      narrows the lane masks to bytes, and pandn keeps the constant-pool
;      byte only in lanes that were NOT zero;
;   3. the vector is spilled to the stack and its bytes are folded with a
;      cmpb/cmov chain (cmova/cmovbe are unsigned conditions, so every step
;      keeps the larger byte);
;   4. the folded value is subtracted from 8 to form the return value in %al.
define i8 @ctz_v8i16(<8 x i16> %a) {
; Constant pool: one byte per lane, counting down from the lane count.
; CHECK-LABEL: .LCPI0_0:
; CHECK-NEXT: .byte 8
; CHECK-NEXT: .byte 7
; CHECK-NEXT: .byte 6
; CHECK-NEXT: .byte 5
; CHECK-NEXT: .byte 4
; CHECK-NEXT: .byte 3
; CHECK-NEXT: .byte 2
; CHECK-NEXT: .byte 1
; Function body: build the per-lane byte vector, then spill it to the stack.
; CHECK-LABEL: ctz_v8i16:
; CHECK: # %bb.0:
; CHECK-NEXT: pxor %xmm1, %xmm1
; CHECK-NEXT: pcmpeqw %xmm0, %xmm1
; CHECK-NEXT: packsswb %xmm1, %xmm1
; CHECK-NEXT: pandn {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1
; CHECK-NEXT: movdqa %xmm1, -{{[0-9]+}}(%rsp)
; Scalar reduction: %cl accumulates the unsigned maximum of the spilled bytes.
; Stack offsets are matched by regex, so the exact slot layout is not pinned.
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %ecx
; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %edx
; CHECK-NEXT: cmpb %cl, %al
; CHECK-NEXT: cmoval %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: cmpb %dl, %cl
; CHECK-NEXT: cmovbel %edx, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; Result = 8 - max; with an all-zero input every byte is 0, so this yields 8.
; CHECK-NEXT: movb $8, %al
; CHECK-NEXT: subb %cl, %al
; CHECK-NEXT: retq
; IR under test: the i1 0 operand selects the non-poison form of the intrinsic
; (NOTE(review): flag meaning taken from the LLVM LangRef — confirm there).
%res = call i8 @llvm.experimental.cttz.elts.i8.v8i16(<8 x i16> %a, i1 0)
ret i8 %res
}
; ctz_v4i32: calls llvm.experimental.cttz.elts on a <4 x i32> argument with
; the trailing i1 flag set to 0 and returns the result as i16 (a wider result
; type than the i8 used by the <8 x i16> tests in this file).
;
; Expected x86-64 lowering, as pinned by the directives inside the function:
;   1. a constant-pool entry holding the descending bytes 4, 3, 2, 1;
;   2. pcmpeqd against zero marks the zero lanes; the mask is narrowed with
;      packssdw, inverted by xor-ing with an all-ones register (pcmpeqd of a
;      register with itself), narrowed again with packsswb and and-ed with
;      the constant-pool bytes;
;   3. the four bytes fit in one 32-bit register, so they are moved out with
;      movd and separated with shifts instead of going through the stack;
;   4. a cmpb/cmova chain keeps the unsigned maximum, which is subtracted
;      from 4 and zero-extended for the i16 return.
define i16 @ctz_v4i32(<4 x i32> %a) {
; Constant pool: one byte per lane, counting down from the lane count.
; CHECK-LABEL: .LCPI1_0:
; CHECK-NEXT: .byte 4
; CHECK-NEXT: .byte 3
; CHECK-NEXT: .byte 2
; CHECK-NEXT: .byte 1
; Function body: build the per-lane byte vector in %xmm0.
; CHECK-LABEL: ctz_v4i32:
; CHECK: # %bb.0:
; CHECK-NEXT: pxor %xmm1, %xmm1
; CHECK-NEXT: pcmpeqd %xmm0, %xmm1
; CHECK-NEXT: packssdw %xmm1, %xmm1
; CHECK-NEXT: pcmpeqd %xmm0, %xmm0
; CHECK-NEXT: pxor %xmm1, %xmm0
; CHECK-NEXT: packsswb %xmm0, %xmm0
; CHECK-NEXT: pand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
; Scalar reduction: bytes 0..3 of %eax are compared pairwise; only the low
; byte of each register takes part in the cmpb comparisons.
; CHECK-NEXT: movd %xmm0, %eax
; CHECK-NEXT: movl %eax, %ecx
; CHECK-NEXT: shrl $8, %ecx
; CHECK-NEXT: cmpb %cl, %al
; CHECK-NEXT: cmoval %eax, %ecx
; CHECK-NEXT: movl %eax, %edx
; CHECK-NEXT: shrl $16, %edx
; CHECK-NEXT: cmpb %dl, %cl
; CHECK-NEXT: cmoval %ecx, %edx
; CHECK-NEXT: shrl $24, %eax
; CHECK-NEXT: cmpb %al, %dl
; CHECK-NEXT: cmoval %edx, %eax
; Result = 4 - max, computed in 8 bits and then zero-extended into %eax.
; CHECK-NEXT: movb $4, %cl
; CHECK-NEXT: subb %al, %cl
; CHECK-NEXT: movzbl %cl, %eax
; CHECK-NEXT: # kill: def $ax killed $ax killed $eax
; CHECK-NEXT: retq
; IR under test: i16 result overload of the intrinsic, flag operand i1 0.
%res = call i16 @llvm.experimental.cttz.elts.i16.v4i32(<4 x i32> %a, i1 0)
ret i16 %res
}
; ZERO IS POISON
; ctz_v8i16_poison: same <8 x i16> -> i8 intrinsic call as ctz_v8i16, but with
; the trailing i1 flag set to 1.
;
; The expected instruction sequence is identical to the one pinned for
; ctz_v8i16 (mask of non-zero lanes and-ed with the descending bytes 8..1,
; unsigned-max reduction through the stack, then 8 - max); only the function
; label and the constant-pool label (.LCPI2_0) differ. In other words, this
; test records that the flag currently does not change the generated code.
define i8 @ctz_v8i16_poison(<8 x i16> %a) {
; Constant pool: one byte per lane, counting down from the lane count.
; CHECK-LABEL: .LCPI2_0:
; CHECK-NEXT: .byte 8
; CHECK-NEXT: .byte 7
; CHECK-NEXT: .byte 6
; CHECK-NEXT: .byte 5
; CHECK-NEXT: .byte 4
; CHECK-NEXT: .byte 3
; CHECK-NEXT: .byte 2
; CHECK-NEXT: .byte 1
; Function body: build the per-lane byte vector, then spill it to the stack.
; CHECK-LABEL: ctz_v8i16_poison:
; CHECK: # %bb.0:
; CHECK-NEXT: pxor %xmm1, %xmm1
; CHECK-NEXT: pcmpeqw %xmm0, %xmm1
; CHECK-NEXT: packsswb %xmm1, %xmm1
; CHECK-NEXT: pandn {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1
; CHECK-NEXT: movdqa %xmm1, -{{[0-9]+}}(%rsp)
; Scalar reduction: %cl accumulates the unsigned maximum of the spilled bytes.
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %ecx
; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: movl -{{[0-9]+}}(%rsp), %edx
; CHECK-NEXT: cmpb %cl, %al
; CHECK-NEXT: cmoval %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: cmpb %dl, %cl
; CHECK-NEXT: cmovbel %edx, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; CHECK-NEXT: movzbl -{{[0-9]+}}(%rsp), %eax
; CHECK-NEXT: cmpb %al, %cl
; CHECK-NEXT: cmovbel %eax, %ecx
; Result = 8 - max.
; CHECK-NEXT: movb $8, %al
; CHECK-NEXT: subb %cl, %al
; CHECK-NEXT: retq
; IR under test: flag operand i1 1, i.e. the "zero is poison" form
; (NOTE(review): an all-zero input then has no defined result per the LLVM
; LangRef — confirm there).
%res = call i8 @llvm.experimental.cttz.elts.i8.v8i16(<8 x i16> %a, i1 1)
ret i8 %res
}
; Declarations of the two intrinsic overloads exercised by this file. The
; mangled suffix encodes <result type>.<vector type>; the trailing i1 operand
; is the flag that the tests pass as 0 or 1.
declare i8 @llvm.experimental.cttz.elts.i8.v8i16(<8 x i16>, i1)
declare i16 @llvm.experimental.cttz.elts.i16.v4i32(<4 x i32>, i1)
; End of the cttz.elts x86-64 codegen expectations.