File: 2012-03-26-FoldImmBug.ll

package info (click to toggle)
llvm-toolchain-9 1%3A9.0.1-16
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 882,436 kB
  • sloc: cpp: 4,167,636; ansic: 714,256; asm: 457,610; python: 155,927; objc: 65,094; sh: 42,856; lisp: 26,908; perl: 7,786; pascal: 7,722; makefile: 6,881; ml: 5,581; awk: 3,648; cs: 2,027; xml: 888; javascript: 381; ruby: 156
file content (33 lines) | stat: -rw-r--r-- 1,098 bytes parent folder | download | duplicates (36)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
; RUN: llc < %s -mtriple=thumbv7-apple-ios -mcpu=cortex-a8 | FileCheck %s

; ARM has a peephole optimization which looks for a def / use pair. The def
; produces a 32-bit immediate which is consumed by the use. It tries to
; fold the immediate by breaking it into two parts and folding them into the
; immediate fields of two uses, e.g.
;        movw    r2, #40885
;        movt    r3, #46540
;        add     r0, r0, r3
; =>
;        add.w   r0, r0, #3019898880
;        add.w   r0, r0, #30146560
;
; However, this transformation is incorrect if the user produces a flag, e.g.
;        movw    r2, #40885
;        movt    r3, #46540
;        adds    r0, r0, r3
; =>
;        add.w   r0, r0, #3019898880
;        adds.w  r0, r0, #30146560
; Note that the final adds.w may not set the carry flag even when the
; original sequence would.
;
; rdar://11116189
; Test function: returns %aInput * 1000000 + C for a 64-bit constant C whose
; low 32 bits are 0xB5CC0000 (46540 << 16), i.e. exactly the value that the
; expected "movs #0" / "movt #46540" pair builds in a register.
; The directives inside the function expect that register to be the last
; operand of a flag-setting adds, rather than the immediate being split and
; folded into the add itself.
; NOTE(review): presumably the i64 add is lowered to a low-word adds whose
; carry feeds the high-word add, which is why the carry must stay exact --
; confirm against the generated assembly.
define i64 @t(i64 %aInput) nounwind {
; CHECK-LABEL: t:
; CHECK: movs [[REG:(r[0-9]+)]], #0
; CHECK: movt [[REG]], #46540
; CHECK: adds r{{[0-9]+}}, r{{[0-9]+}}, [[REG]]
  ; Scale the input; the directives above do not constrain the multiply.
  %1 = mul i64 %aInput, 1000000
  ; 64-bit add of the constant; its low word is the 0xB5CC0000 immediate
  ; matched above.
  %2 = add i64 %1, -7952618389194932224
  ret i64 %2
}