File: no-rex2-general.ll

package info (click to toggle)
llvm-toolchain-19 1%3A19.1.7-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,998,520 kB
  • sloc: cpp: 6,951,680; ansic: 1,486,157; asm: 913,598; python: 232,024; f90: 80,126; objc: 75,281; lisp: 37,276; pascal: 16,990; sh: 10,009; ml: 5,058; perl: 4,724; awk: 3,523; makefile: 3,167; javascript: 2,504; xml: 892; fortran: 664; cs: 573
file content (83 lines) | stat: -rw-r--r-- 3,718 bytes parent folder | download | duplicates (7)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown -stop-after=x86-isel -mattr=+sse2,+ssse3,+egpr  | FileCheck %s --check-prefix=SSE
; RUN: llc < %s -mtriple=x86_64-unknown -stop-after=x86-isel -mattr=+sse2,+ssse3,+egpr,+avx | FileCheck %s --check-prefix=AVX
; RUN: llc < %s -enable-new-pm -mtriple=x86_64-unknown -stop-after=x86-isel -mattr=+sse2,+ssse3,+egpr  | FileCheck %s --check-prefix=SSE
; RUN: llc < %s -enable-new-pm -mtriple=x86_64-unknown -stop-after=x86-isel -mattr=+sse2,+ssse3,+egpr,+avx | FileCheck %s --check-prefix=AVX

define i32 @map0(ptr nocapture noundef readonly %a, i64 noundef %b) {
  ; SSE-LABEL: name: map0
  ; SSE: bb.0.entry:
  ; SSE-NEXT:   liveins: $rdi, $rsi
  ; SSE-NEXT: {{  $}}
  ; SSE-NEXT:   [[COPY:%[0-9]+]]:gr64_nosp = COPY $rsi
  ; SSE-NEXT:   [[COPY1:%[0-9]+]]:gr64 = COPY $rdi
  ; SSE-NEXT:   [[MOV32rm:%[0-9]+]]:gr32 = MOV32rm [[COPY1]], 4, [[COPY]], 0, $noreg :: (load (s32) from %ir.add.ptr)
  ; SSE-NEXT:   $eax = COPY [[MOV32rm]]
  ; SSE-NEXT:   RET 0, $eax
  ; AVX-LABEL: name: map0
  ; AVX: bb.0.entry:
  ; AVX-NEXT:   liveins: $rdi, $rsi
  ; AVX-NEXT: {{  $}}
  ; AVX-NEXT:   [[COPY:%[0-9]+]]:gr64_nosp = COPY $rsi
  ; AVX-NEXT:   [[COPY1:%[0-9]+]]:gr64 = COPY $rdi
  ; AVX-NEXT:   [[MOV32rm:%[0-9]+]]:gr32 = MOV32rm [[COPY1]], 4, [[COPY]], 0, $noreg :: (load (s32) from %ir.add.ptr)
  ; AVX-NEXT:   $eax = COPY [[MOV32rm]]
  ; AVX-NEXT:   RET 0, $eax
entry:
  %add.ptr = getelementptr inbounds i32, ptr %a, i64 %b
  %0 = load i32, ptr %add.ptr
  ret i32 %0
}

define i32 @map1_or_vex(<2 x double> noundef %a) {
  ; SSE-LABEL: name: map1_or_vex
  ; SSE: bb.0.entry:
  ; SSE-NEXT:   liveins: $xmm0
  ; SSE-NEXT: {{  $}}
  ; SSE-NEXT:   [[COPY:%[0-9]+]]:vr128 = COPY $xmm0
  ; SSE-NEXT:   [[CVTSD2SIrr_Int:%[0-9]+]]:gr32 = nofpexcept CVTSD2SIrr_Int [[COPY]], implicit $mxcsr
  ; SSE-NEXT:   $eax = COPY [[CVTSD2SIrr_Int]]
  ; SSE-NEXT:   RET 0, $eax
  ; AVX-LABEL: name: map1_or_vex
  ; AVX: bb.0.entry:
  ; AVX-NEXT:   liveins: $xmm0
  ; AVX-NEXT: {{  $}}
  ; AVX-NEXT:   [[COPY:%[0-9]+]]:vr128 = COPY $xmm0
  ; AVX-NEXT:   [[VCVTSD2SIrr_Int:%[0-9]+]]:gr32_norex2 = nofpexcept VCVTSD2SIrr_Int [[COPY]], implicit $mxcsr
  ; AVX-NEXT:   $eax = COPY [[VCVTSD2SIrr_Int]]
  ; AVX-NEXT:   RET 0, $eax
entry:
  %0 = tail call i32 @llvm.x86.sse2.cvtsd2si(<2 x double> %a)
  ret i32 %0
}

define <2 x i64> @map2_or_vex(ptr nocapture noundef readonly %b, i64 noundef %c) {
  ; SSE-LABEL: name: map2_or_vex
  ; SSE: bb.0.entry:
  ; SSE-NEXT:   liveins: $rdi, $rsi
  ; SSE-NEXT: {{  $}}
  ; SSE-NEXT:   [[COPY:%[0-9]+]]:gr64_norex2_nosp = COPY $rsi
  ; SSE-NEXT:   [[COPY1:%[0-9]+]]:gr64_norex2 = COPY $rdi
  ; SSE-NEXT:   [[PABSBrm:%[0-9]+]]:vr128 = PABSBrm [[COPY1]], 4, [[COPY]], 0, $noreg :: (load (s128) from %ir.add.ptr)
  ; SSE-NEXT:   $xmm0 = COPY [[PABSBrm]]
  ; SSE-NEXT:   RET 0, $xmm0
  ; AVX-LABEL: name: map2_or_vex
  ; AVX: bb.0.entry:
  ; AVX-NEXT:   liveins: $rdi, $rsi
  ; AVX-NEXT: {{  $}}
  ; AVX-NEXT:   [[COPY:%[0-9]+]]:gr64_norex2_nosp = COPY $rsi
  ; AVX-NEXT:   [[COPY1:%[0-9]+]]:gr64_norex2 = COPY $rdi
  ; AVX-NEXT:   [[VPABSBrm:%[0-9]+]]:vr128 = VPABSBrm [[COPY1]], 4, [[COPY]], 0, $noreg :: (load (s128) from %ir.add.ptr)
  ; AVX-NEXT:   $xmm0 = COPY [[VPABSBrm]]
  ; AVX-NEXT:   RET 0, $xmm0
entry:
  %add.ptr = getelementptr inbounds i32, ptr %b, i64 %c
  %a = load <2 x i64>, ptr %add.ptr
  %0 = bitcast <2 x i64> %a to <16 x i8>
  %elt.abs.i = tail call <16 x i8> @llvm.abs.v16i8(<16 x i8> %0, i1 false)
  %1 = bitcast <16 x i8> %elt.abs.i to <2 x i64>
  ret <2 x i64> %1
}

declare i32 @llvm.x86.sse2.cvtsd2si(<2 x double>)
declare <16 x i8> @llvm.abs.v16i8(<16 x i8>, i1 immarg)