File: kryo.ll

package info (click to toggle)
llvm-toolchain-15 1%3A15.0.6-4
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,554,644 kB
  • sloc: cpp: 5,922,452; ansic: 1,012,136; asm: 674,362; python: 191,568; objc: 73,855; f90: 42,327; lisp: 31,913; pascal: 11,973; javascript: 10,144; sh: 9,421; perl: 7,447; ml: 5,527; awk: 3,523; makefile: 2,520; xml: 885; cs: 573; fortran: 567
file content (50 lines) | stat: -rw-r--r-- 1,991 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
; RUN: opt < %s -passes='print<cost-model>' 2>&1 -disable-output -mcpu=kryo | FileCheck %s
;
; Cost-model test for vector insertelement/extractelement with the Kryo CPU
; selected. opt runs the cost-model printer over every function in this file
; without emitting a module, and FileCheck verifies the reported costs against
; the directives embedded in the functions below. The 2>&1 folds stderr into
; the pipe (presumably because the printer reports on stderr - confirm).

; Target configuration: AArch64 Linux (see the triple below).
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
target triple = "aarch64--linux-gnu"

; CHECK-LABEL: vectorInstrCost
define void @vectorInstrCost() {
    ; Exercises element 0 and element 1 of a <2 x i64> for both extractelement
    ; and insertelement. Every operand is undef and no result is used, so the
    ; function exists only for the per-instruction costs that get reported.
    ; The {{.*}} in each directive skips whatever the report prints between
    ; the cost and the instruction text.

    ; Vector extracts - extracting the first element should have a zero cost;
    ; all other elements should have a cost of two.
    ;
    ; CHECK: cost of 0 {{.*}} extractelement <2 x i64> undef, i32 0
    ; CHECK: cost of 2 {{.*}} extractelement <2 x i64> undef, i32 1
    %t1 = extractelement <2 x i64> undef, i32 0
    %t2 = extractelement <2 x i64> undef, i32 1

    ; Vector inserts - inserting the first element should have a zero cost; all
    ; other elements should have a cost of two.
    ;
    ; CHECK: cost of 0 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 0
    ; CHECK: cost of 2 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 1
    %t3 = insertelement <2 x i64> undef, i64 undef, i32 0
    %t4 = insertelement <2 x i64> undef, i64 undef, i32 1

    ret void
}

; CHECK-LABEL: vectorInstrExtractCost
define i64 @vectorInstrExtractCost(<4 x i64> %vecreg) {
    ; Extracts all four elements of the <4 x i64> argument and verifies the
    ; cost reported for each index. The expected costs alternate: indices 0
    ; and 2 are free, indices 1 and 3 cost two.

    ; Vector extracts - extracting the element at index 0 is considered free
    ; in the current implementation. When extracting the element at index 2,
    ; the index is rounded down to 0 before the cost is computed, so that
    ; extract has cost 0 as well. Index 1 has a cost of two.
    ; NOTE(review): presumably the rounding reflects <4 x i64> being split
    ; into two <2 x i64> halves during type legalization - confirm against the
    ; AArch64 cost model implementation.
    ;
    ; CHECK: cost of 2 {{.*}} extractelement <4 x i64> %vecreg, i32 1
    ; CHECK: cost of 0 {{.*}} extractelement <4 x i64> %vecreg, i32 2
    %t1 = extractelement <4 x i64> %vecreg, i32 1
    %t2 = extractelement <4 x i64> %vecreg, i32 2
    ; Give both extracted elements a use: %t2 feeds the add, and %t1 is
    ; compared against the sum.
    %ele = add i64 %t2, 1
    %cond = icmp eq i64 %t1, %ele

    ; Remaining elements: index 0 is free and index 3 has a cost of two
    ; (NOTE(review): presumably index 3 is reduced to 1 the same way index 2
    ; is reduced to 0 - confirm).
    ;
    ; CHECK: cost of 0 {{.*}} extractelement <4 x i64> %vecreg, i32 0
    ; CHECK: cost of 2 {{.*}} extractelement <4 x i64> %vecreg, i32 3
    %t0 = extractelement <4 x i64> %vecreg, i32 0
    %t3 = extractelement <4 x i64> %vecreg, i32 3
    ; The select picks between the last two extracts, so all four extracted
    ; elements contribute to the returned value.
    %val = select i1 %cond, i64 %t0 , i64 %t3

    ret i64 %val
}