File: pr55158.ll

package info (click to toggle)
llvm-toolchain-17 1%3A17.0.6-22
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,799,624 kB
  • sloc: cpp: 6,428,607; ansic: 1,383,196; asm: 793,408; python: 223,504; objc: 75,364; f90: 60,502; lisp: 33,869; pascal: 15,282; sh: 9,684; perl: 7,453; ml: 4,937; awk: 3,523; makefile: 2,889; javascript: 2,149; xml: 888; fortran: 619; cs: 573
file content (35 lines) | stat: -rw-r--r-- 1,702 bytes parent folder | download | duplicates (10)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-linux -mcpu=ivybridge -mattr=+avx2 | FileCheck %s
; RUN: llc < %s -mtriple=x86_64-linux -mcpu=haswell | FileCheck %s

define <2 x i64> @PR55158(ptr %0) {
; CHECK-LABEL: PR55158:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpxor %xmm0, %xmm0, %xmm0
; CHECK-NEXT:    vphsubw 64(%rdi), %xmm0, %xmm0
; CHECK-NEXT:    retq
  %2 = load <16 x i8>, ptr %0, align 16
  %3 = getelementptr inbounds i32, ptr %0, i64 16
  %4 = load <8 x i16>, ptr %3, align 16
  %5 = getelementptr inbounds i32, ptr %0, i64 32
  %6 = load <4 x i32>, ptr %5, align 16
  %7 = shufflevector <16 x i8> %2, <16 x i8> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
  %8 = sext <4 x i8> %7 to <4 x i32>
  %9 = icmp sgt <4 x i32> %6, %8
  %10 = sext <4 x i1> %9 to <4 x i32>
  %11 = tail call <8 x i16> @llvm.x86.ssse3.phsub.w.128(<8 x i16> %4, <8 x i16> %4)
  %12 = bitcast <8 x i16> %11 to <2 x i64>
  %13 = shufflevector <4 x i32> %10, <4 x i32> poison, <2 x i32> <i32 0, i32 1>
  %14 = zext <2 x i32> %13 to <2 x i64>
  %15 = bitcast <8 x i16> %11 to <16 x i8>
  %16 = icmp ne <16 x i8> %15, zeroinitializer
  %17 = sext <16 x i1> %16 to <16 x i8>
  %18 = shufflevector <16 x i8> %17, <16 x i8> poison, <2 x i32> <i32 0, i32 1>
  %19 = zext <2 x i8> %18 to <2 x i64>
  %20 = insertelement <2 x i64> %19, i64 0, i64 1
  %21 = tail call <2 x i64> @llvm.x86.avx2.psrlv.q(<2 x i64> %20, <2 x i64> %14)
  %22 = shufflevector <2 x i64> %21, <2 x i64> %12, <2 x i32> <i32 1, i32 3>
  ret <2 x i64> %22
}
declare <8 x i16> @llvm.x86.ssse3.phsub.w.128(<8 x i16>, <8 x i16>)
declare <2 x i64> @llvm.x86.avx2.psrlv.q(<2 x i64>, <2 x i64>)