File: repeated_instrs.ll

package info (click to toggle)
llvm-toolchain-21 1%3A21.1.6-3
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 2,245,028 kB
  • sloc: cpp: 7,619,726; ansic: 1,434,018; asm: 1,058,748; python: 252,740; f90: 94,671; objc: 70,685; lisp: 42,813; pascal: 18,401; sh: 8,601; ml: 5,111; perl: 4,720; makefile: 3,675; awk: 3,523; javascript: 2,409; xml: 892; fortran: 770
file content (65 lines) | stat: -rw-r--r-- 3,168 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
; RUN: opt -passes=sandbox-vectorizer -sbvec-vec-reg-bits=1024 -sbvec-allow-non-pow2 -sbvec-passes="seed-collection<tr-save,bottom-up-vec,tr-accept>" %s -S | FileCheck %s

define i32 @repeated_splat(ptr %ptr, i32 %v) #0 {
; CHECK-LABEL: define i32 @repeated_splat(
; CHECK-SAME: ptr [[PTR:%.*]], i32 [[V:%.*]]) {
; CHECK-NEXT:    [[GEP0:%.*]] = getelementptr inbounds i32, ptr [[PTR]], i64 0
; CHECK-NEXT:    [[SPLAT:%.*]] = add i32 [[V]], 0
; CHECK-NEXT:    [[PACK:%.*]] = insertelement <2 x i32> poison, i32 [[SPLAT]], i32 0
; CHECK-NEXT:    [[PACK1:%.*]] = insertelement <2 x i32> [[PACK]], i32 [[SPLAT]], i32 1
; CHECK-NEXT:    [[VECL:%.*]] = load <2 x i32>, ptr [[GEP0]], align 4
; CHECK-NEXT:    [[VEC:%.*]] = mul <2 x i32> [[VECL]], [[PACK1]]
; CHECK-NEXT:    store <2 x i32> [[VEC]], ptr [[GEP0]], align 4
; CHECK-NEXT:    ret i32 0
;
  %gep0 = getelementptr inbounds i32, ptr %ptr, i64 0
  %gep1 = getelementptr inbounds i32, ptr %ptr, i64 1
  %ld0 = load i32, ptr %gep0, align 4
  %ld1 = load i32, ptr %gep1, align 4
  %splat = add i32 %v, 0
  %add0 = mul i32 %ld0, %splat
  %add1 = mul i32 %ld1, %splat
  store i32 %add0, ptr %gep0, align 4
  store i32 %add1, ptr %gep1, align 4
  ret i32 0
}

define i32 @repeated_partial(ptr %ptr, i32 %v) #0 {
; CHECK-LABEL: define i32 @repeated_partial(
; CHECK-SAME: ptr [[PTR:%.*]], i32 [[V:%.*]]) {
; CHECK-NEXT:    [[GEP0:%.*]] = getelementptr inbounds i32, ptr [[PTR]], i64 0
; CHECK-NEXT:    [[GEP1:%.*]] = getelementptr inbounds i32, ptr [[PTR]], i64 1
; CHECK-NEXT:    [[GEP3:%.*]] = getelementptr inbounds i32, ptr [[PTR]], i64 3
; CHECK-NEXT:    [[SPLAT:%.*]] = add i32 [[V]], 0
; CHECK-NEXT:    [[LD0:%.*]] = load i32, ptr [[GEP0]], align 4
; CHECK-NEXT:    [[LD1:%.*]] = load i32, ptr [[GEP1]], align 4
; CHECK-NEXT:    [[LD3:%.*]] = load i32, ptr [[GEP3]], align 4
; CHECK-NEXT:    [[PACK:%.*]] = insertelement <4 x i32> poison, i32 [[LD0]], i32 0
; CHECK-NEXT:    [[PACK1:%.*]] = insertelement <4 x i32> [[PACK]], i32 [[LD1]], i32 1
; CHECK-NEXT:    [[PACK2:%.*]] = insertelement <4 x i32> [[PACK1]], i32 [[LD1]], i32 2
; CHECK-NEXT:    [[PACK3:%.*]] = insertelement <4 x i32> [[PACK2]], i32 [[LD3]], i32 3
; CHECK-NEXT:    [[VECL:%.*]] = load <4 x i32>, ptr [[GEP0]], align 4
; CHECK-NEXT:    [[VEC:%.*]] = mul <4 x i32> [[VECL]], [[PACK3]]
; CHECK-NEXT:    store <4 x i32> [[VEC]], ptr [[GEP0]], align 4
; CHECK-NEXT:    ret i32 0
;
  %gep0 = getelementptr inbounds i32, ptr %ptr, i64 0
  %gep1 = getelementptr inbounds i32, ptr %ptr, i64 1
  %gep2 = getelementptr inbounds i32, ptr %ptr, i64 2
  %gep3 = getelementptr inbounds i32, ptr %ptr, i64 3
  %ld0 = load i32, ptr %gep0, align 4
  %ld1 = load i32, ptr %gep1, align 4
  %ld2 = load i32, ptr %gep2, align 4
  %ld3 = load i32, ptr %gep3, align 4
  %splat = add i32 %v, 0
  %add0 = mul i32 %ld0, %ld0
  %add1 = mul i32 %ld1, %ld1
  %add2 = mul i32 %ld2, %ld1
  %add3 = mul i32 %ld3, %ld3
  store i32 %add0, ptr %gep0, align 4
  store i32 %add1, ptr %gep1, align 4
  store i32 %add2, ptr %gep2, align 4
  store i32 %add3, ptr %gep3, align 4
  ret i32 0
}