File: falkor-hwpf-fix.ll

package info (click to toggle)
llvm-toolchain-17 1%3A17.0.6-22
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,799,624 kB
  • sloc: cpp: 6,428,607; ansic: 1,383,196; asm: 793,408; python: 223,504; objc: 75,364; f90: 60,502; lisp: 33,869; pascal: 15,282; sh: 9,684; perl: 7,453; ml: 4,937; awk: 3,523; makefile: 2,889; javascript: 2,149; xml: 888; fortran: 619; cs: 573
file content (67 lines) | stat: -rw-r--r-- 1,957 bytes parent folder | download | duplicates (12)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
; RUN: llc < %s -mtriple aarch64 -mcpu=falkor -disable-post-ra | FileCheck %s

; Check that strided load tag collisions are avoided on Falkor.

; CHECK-LABEL: hwpf1:
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE:[0-9]+]], #-16]
; CHECK: mov x[[BASE2:[0-9]+]], x[[BASE]]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE2]], #-8]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE3:[0-9]+]]]
; CHECK: mov x[[BASE4:[0-9]+]], x[[BASE3]]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE4]], #8]

; hwpf1 - test input: a counted loop that reads eight consecutive i32 values
; from %p on every iteration.
;
; Per iteration the loop loads p[iv] .. p[iv+7], adds them in adjacent pairs
; and stores the four sums to sp[iv], sp2[iv], sp3[iv] and sp4[iv]. %iv starts
; at 0 and is stepped by 8 until the stepped value is >= 1024 (unsigned), i.e.
; 128 iterations.
;
; All eight loads are addressed relative to the same %gep. The FileCheck
; patterns for this function expect them to be emitted as four ldp
; instructions (offsets #-16, #-8, none, #8), with a register-to-register mov
; in front of the second and fourth ldp so that those use a copied base
; register.
; NOTE(review): presumably the copied base registers are what avoids the
; Falkor load tag collisions mentioned at the top of the file - confirm
; against the AArch64 Falkor HW prefetch fix pass.
;
; The instruction order and GEP structure below are what the expected output
; was written against; keep them as they are when editing.
define void @hwpf1(ptr %p, ptr %sp, ptr %sp2, ptr %sp3, ptr %sp4) {
entry:
  br label %loop

loop:
  ; Element index shared by the source and all four destinations:
  ; 0 when entered from %entry, %inc on the back edge.
  %iv = phi i32 [ 0, %entry ], [ %inc, %loop ]

  ; %gep = &p[iv]; every other load address below is derived from it.
  %gep = getelementptr inbounds i32, ptr %p, i32 %iv
  %load1 = load i32, ptr %gep

  ; p[iv+1]
  %gep2 = getelementptr inbounds i32, ptr %gep, i32 1
  %load2 = load i32, ptr %gep2

  ; sp[iv] = p[iv] + p[iv+1]
  %add = add i32 %load1, %load2
  %storegep = getelementptr inbounds i32, ptr %sp, i32 %iv
  store i32 %add, ptr %storegep

  ; p[iv+2]
  %gep3 = getelementptr inbounds i32, ptr %gep, i32 2
  %load3 = load i32, ptr %gep3

  ; p[iv+3]
  %gep4 = getelementptr inbounds i32, ptr %gep, i32 3
  %load4 = load i32, ptr %gep4

  ; sp2[iv] = p[iv+2] + p[iv+3]
  %add2 = add i32 %load3, %load4
  %storegep2 = getelementptr inbounds i32, ptr %sp2, i32 %iv
  store i32 %add2, ptr %storegep2

  ; p[iv+4]
  %gep5 = getelementptr inbounds i32, ptr %gep, i32 4
  %load5 = load i32, ptr %gep5

  ; p[iv+5]
  %gep6 = getelementptr inbounds i32, ptr %gep, i32 5
  %load6 = load i32, ptr %gep6

  ; sp3[iv] = p[iv+4] + p[iv+5]
  %add3 = add i32 %load5, %load6
  %storegep3 = getelementptr inbounds i32, ptr %sp3, i32 %iv
  store i32 %add3, ptr %storegep3

  ; p[iv+6]
  %gep7 = getelementptr inbounds i32, ptr %gep, i32 6
  %load7 = load i32, ptr %gep7

  ; p[iv+7]
  %gep8 = getelementptr inbounds i32, ptr %gep, i32 7
  %load8 = load i32, ptr %gep8

  ; sp4[iv] = p[iv+6] + p[iv+7]
  %add4 = add i32 %load7, %load8
  %storegep4 = getelementptr inbounds i32, ptr %sp4, i32 %iv
  store i32 %add4, ptr %storegep4

  ; Step by the eight elements consumed above; leave the loop once the
  ; stepped index is >= 1024 (unsigned compare), otherwise take the back edge.
  %inc = add i32 %iv, 8
  %exitcnd = icmp uge i32 %inc, 1024
  br i1 %exitcnd, label %exit, label %loop

exit:
  ret void
}