File: dagcombine-unsafe-math.ll

package info (click to toggle)
llvm-toolchain-3.7 1%3A3.7.1-5
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 345,556 kB
  • ctags: 362,199
  • sloc: cpp: 2,156,381; ansic: 458,339; objc: 91,547; python: 89,988; asm: 86,305; sh: 21,479; makefile: 6,853; perl: 5,601; ml: 5,458; pascal: 3,933; lisp: 2,429; xml: 686; cs: 239; php: 202; csh: 117
file content (56 lines) | stat: -rw-r--r-- 1,550 bytes parent folder | download | duplicates (10)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
; The lit directive below compiles this file with llc (unsafe FP math enabled,
; x86_64 Darwin triple, corei7-avx CPU) and pipes the generated assembly into
; FileCheck, which matches it against the check directives in this file.
; RUN: llc < %s -enable-unsafe-fp-math -mtriple=x86_64-apple-darwin -mcpu=corei7-avx | FileCheck %s 


; rdar://13126763
; Expression "x + x*x" was mistakenly transformed into "x * 3.0f".

define float @test1(float %x) {
  ; Computes x*x + x. The expected assembly must still contain a vaddss,
  ; i.e. the addition is not folded away into a multiply by a constant.
  %sq = fmul fast float %x, %x
  %sum = fadd fast float %sq, %x
  ret float %sum
; CHECK: test1
; CHECK: vaddss
}

; (x + x) + x => x * 3.0
define float @test2(float %x) {
  ; Left-nested sum: (x + x) + x.
  %twice = fadd fast float %x, %x
  %thrice = fadd fast float %twice, %x
  ret float %thrice
  ; 1077936128 == 0x40400000, the IEEE-754 single-precision encoding of 3.0.
  ; The constant-pool entry is matched before the function label, and the
  ; function body is expected to multiply by that pool entry.
; CHECK: .long  1077936128
; CHECK: test2
; CHECK: vmulss LCPI1_0(%rip), %xmm0, %xmm0
}

; x + (x + x) => x * 3.0
define float @test3(float %x) {
  ; Right-nested sum: x + (x + x). The doubled value has to be the SECOND
  ; operand of the outer fadd; with the operands the other way round this
  ; function would be identical to @test2 and the right-nested form would
  ; never be exercised.
  %t1 = fadd fast float %x, %x
  %t2 = fadd fast float %x, %t1
  ret float %t2
  ; 1077936128 == 0x40400000, the IEEE-754 single-precision encoding of 3.0.
  ; The expected code multiplies x by that constant-pool entry.
; CHECK: .long  1077936128
; CHECK: test3
; CHECK: vmulss LCPI2_0(%rip), %xmm0, %xmm0
}

; (x + y) + x != x * 3.0
define float @test4(float %x, float %y) {
  ; Computes (x + y) + x. Only two of the three addends are x, so the
  ; expected assembly must still contain a vaddss.
  %xy = fadd fast float %x, %y
  %xyx = fadd fast float %xy, %x
  ret float %xyx
; CHECK: test4
; CHECK: vaddss
}

; rdar://13445387
; The "x + x + x => 3.0 * x" combine should be disabled after legalization
; because instruction selection doesn't know how to handle the constant "3.0".
;
define float @test5() {
  ; Multiplies two all-zero <4 x float> vectors, then adds lanes 0, 1 and 2
  ; of the product with scalar fadds. No FileCheck directives follow, so
  ; presumably this function only has to compile without crashing
  ; (NOTE(review): confirm against the original bug report).
  %prod = fmul <4 x float> zeroinitializer, zeroinitializer
  %lane1 = extractelement <4 x float> %prod, i32 1
  %lane0 = extractelement <4 x float> %prod, i32 0
  %sum01 = fadd float %lane0, %lane1
  %lane2 = extractelement <4 x float> %prod, i32 2
  %sum012 = fadd float %lane2, %sum01
  ret float %sum012
}