File: pmul.ll

package info (click to toggle)
llvm-3.1 3.1-1
  • links: PTS, VCS
  • area: main
  • in suites: wheezy
  • size: 80,224 kB
  • sloc: cpp: 491,014; asm: 110,971; ansic: 14,579; sh: 13,120; python: 6,152; ml: 4,719; makefile: 1,830; pascal: 1,553; perl: 874; xml: 283; lisp: 187; csh: 117; exp: 4
file content (34 lines) | stat: -rw-r--r-- 1,080 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
; RUN: llc < %s -march=x86 -mattr=sse41 -stack-alignment=16 -join-physregs > %t
; RUN: grep pmul %t | count 12
; RUN: grep mov %t | count 11

; The f() arguments in %xmm0 and %xmm1 cause an extra movdqa without -join-physregs.

; Lane-wise multiply of a <4 x i32> argument by a constant vector whose four
; lanes are all 117; the product is returned directly.
define <4 x i32> @a(<4 x i32> %i) nounwind {
  %prod = mul <4 x i32> %i, <i32 117, i32 117, i32 117, i32 117>
  ret <4 x i32> %prod
}
; Lane-wise multiply of a <2 x i64> argument by a constant vector whose two
; lanes are both 117; the product is returned directly.
define <2 x i64> @b(<2 x i64> %i) nounwind {
  %prod = mul <2 x i64> %i, <i64 117, i64 117>
  ret <2 x i64> %prod
}
; Lane-wise multiply of two <4 x i32> arguments (no constant operand).
define <4 x i32> @c(<4 x i32> %i, <4 x i32> %j) nounwind {
  %prod = mul <4 x i32> %i, %j
  ret <4 x i32> %prod
}
; Lane-wise multiply of two <2 x i64> arguments (no constant operand).
define <2 x i64> @d(<2 x i64> %i, <2 x i64> %j) nounwind {
  %prod = mul <2 x i64> %i, %j
  ret <2 x i64> %prod
}
; Use a call to force spills.
; @foo is only declared here (no body in this file); it takes no arguments and
; returns void. It exists so that a function can place a call ahead of its
; multiply.
declare void @foo()
; <4 x i32> multiply of two vector arguments, issued after a call to @foo.
; Neither %i nor %j is used before the call, so both must survive it.
define <4 x i32> @e(<4 x i32> %i, <4 x i32> %j) nounwind {
  call void @foo()
  %prod = mul <4 x i32> %i, %j
  ret <4 x i32> %prod
}
; <2 x i64> multiply of two vector arguments, issued after a call to @foo.
; Neither %i nor %j is used before the call, so both must survive it.
define <2 x i64> @f(<2 x i64> %i, <2 x i64> %j) nounwind {
  call void @foo()
  %prod = mul <2 x i64> %i, %j
  ret <2 x i64> %prod
}