File: arith-max-cost.ll

package info (click to toggle)
llvm-toolchain-15 1%3A15.0.6-4
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,554,644 kB
  • sloc: cpp: 5,922,452; ansic: 1,012,136; asm: 674,362; python: 191,568; objc: 73,855; f90: 42,327; lisp: 31,913; pascal: 11,973; javascript: 10,144; sh: 9,421; perl: 7,447; ml: 5,527; awk: 3,523; makefile: 2,520; xml: 885; cs: 573; fortran: 567
file content (40 lines) | stat: -rw-r--r-- 1,782 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -slp-vectorizer -mcpu=corei7-avx -mtriple=x86_64-unknown-linux -S | FileCheck %s

; This test checks whether the cost of the vector max intrinsic is calculated
; correctly. A max vector intrinsic combines the select and icmp instructions.
; This maps to a single PMAX instruction in x86.
; Signed variant. Each icmp sgt / select pair below picks the larger of an
; argument and a constant (a signed-max pattern), and the two results feed a
; single final compare. The autogenerated assertions expect the output to
; contain the same scalar instructions as the input.
define void @smax_intrinsic_cost(i64 %arg0, i64 %arg1) {
; CHECK-LABEL: @smax_intrinsic_cost(
; CHECK-NEXT:    [[ICMP0:%.*]] = icmp sgt i64 [[ARG0:%.*]], 123
; CHECK-NEXT:    [[ICMP1:%.*]] = icmp sgt i64 [[ARG1:%.*]], 456
; CHECK-NEXT:    [[SELECT0:%.*]] = select i1 [[ICMP0]], i64 [[ARG0]], i64 123
; CHECK-NEXT:    [[SELECT1:%.*]] = select i1 [[ICMP1]], i64 [[ARG1]], i64 456
; CHECK-NEXT:    [[ROOT:%.*]] = icmp sle i64 [[SELECT0]], [[SELECT1]]
; CHECK-NEXT:    ret void
;
  ; %select0 = signed max(%arg0, 123); %select1 = signed max(%arg1, 456).
  %icmp0 = icmp sgt i64 %arg0, 123
  %icmp1 = icmp sgt i64 %arg1, 456
  %select0 = select i1 %icmp0, i64 %arg0, i64 123
  %select1 = select i1 %icmp1, i64 %arg1, i64 456
  ; The compare result is never used; presumably it only serves as the point
  ; from which the vectorizer starts looking at the two selects (to confirm).
  %root = icmp sle i64 %select0, %select1
  ret void
}


; Unsigned variant of the max-cost test. Each icmp ugt / select pair below
; picks the larger of an argument and a constant under unsigned comparison
; (an unsigned-max pattern), and the two results feed a single final compare.
; The autogenerated assertions expect the output to contain the same scalar
; instructions as the input.
define void @umax_intrinsic_cost(i64 %arg0, i64 %arg1) {
; CHECK-LABEL: @umax_intrinsic_cost(
; CHECK-NEXT:    [[ICMP0:%.*]] = icmp ugt i64 [[ARG0:%.*]], 123
; CHECK-NEXT:    [[ICMP1:%.*]] = icmp ugt i64 [[ARG1:%.*]], 456
; CHECK-NEXT:    [[SELECT0:%.*]] = select i1 [[ICMP0]], i64 [[ARG0]], i64 123
; CHECK-NEXT:    [[SELECT1:%.*]] = select i1 [[ICMP1]], i64 [[ARG1]], i64 456
; CHECK-NEXT:    [[ROOT:%.*]] = icmp sle i64 [[SELECT0]], [[SELECT1]]
; CHECK-NEXT:    ret void
;
  ; %select0 = unsigned max(%arg0, 123); %select1 = unsigned max(%arg1, 456).
  %icmp0 = icmp ugt i64 %arg0, 123
  %icmp1 = icmp ugt i64 %arg1, 456
  %select0 = select i1 %icmp0, i64 %arg0, i64 123
  %select1 = select i1 %icmp1, i64 %arg1, i64 456
  ; NOTE(review): the final compare uses the signed predicate (sle) even in
  ; this unsigned variant. Its result is never used, so this looks like it is
  ; only a consumer of the two selects; confirm it is intentional.
  %root = icmp sle i64 %select0, %select1
  ret void
}