; Cost-model test for vector element insert/extract instructions on AArch64
; when targeting the Kryo CPU (see -mcpu=kryo on the command line below).
; RUN: opt < %s -passes='print<cost-model>' 2>&1 -disable-output -mcpu=kryo | FileCheck %s
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
target triple = "aarch64--linux-gnu"
; CHECK-LABEL: vectorInstrCost
define void @vectorInstrCost() {
; Exercises the reported cost of element extracts and inserts on <2 x i64>.
; All operands are undef, so the only thing varying between the paired
; instructions is the lane index.
;
; Vector extracts - extracting the first element (index 0) should have a
; zero cost; all other elements should have a cost of two.
;
; CHECK: cost of 0 {{.*}} extractelement <2 x i64> undef, i32 0
; CHECK: cost of 2 {{.*}} extractelement <2 x i64> undef, i32 1
%t1 = extractelement <2 x i64> undef, i32 0
%t2 = extractelement <2 x i64> undef, i32 1
; Vector inserts - inserting into the first element (index 0) should have a
; zero cost; all other elements should have a cost of two.
;
; CHECK: cost of 0 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 0
; CHECK: cost of 2 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 1
%t3 = insertelement <2 x i64> undef, i64 undef, i32 0
%t4 = insertelement <2 x i64> undef, i64 undef, i32 1
; The results are intentionally unused; only the printed costs matter.
ret void
}
; CHECK-LABEL: vectorInstrExtractCost
define i64 @vectorInstrExtractCost(<4 x i64> %vecreg) {
; Exercises the reported cost of extracting every lane of a <4 x i64>
; argument. The extracts are issued in the order 1, 2, 0, 3 and the
; expectations below follow that same order.
;
; Vector extracts - extracting the element at index 0 is considered free in
; the current implementation. When extracting the element at index 2, the
; index is rounded to 0, so that extract has a cost of 0 as well. The
; elements at indices 1 and 3 are expected to have a cost of two.
; NOTE(review): the rounding presumably comes from <4 x i64> being split into
; two <2 x i64> halves during legalization - confirm against the AArch64
; cost model.
;
; CHECK: cost of 2 {{.*}} extractelement <4 x i64> %vecreg, i32 1
; CHECK: cost of 0 {{.*}} extractelement <4 x i64> %vecreg, i32 2
%t1 = extractelement <4 x i64> %vecreg, i32 1
%t2 = extractelement <4 x i64> %vecreg, i32 2
; Consume lanes 1 and 2: compare lane 1 against (lane 2 + 1).
%ele = add i64 %t2, 1
%cond = icmp eq i64 %t1, %ele
; CHECK: cost of 0 {{.*}} extractelement <4 x i64> %vecreg, i32 0
; CHECK: cost of 2 {{.*}} extractelement <4 x i64> %vecreg, i32 3
%t0 = extractelement <4 x i64> %vecreg, i32 0
%t3 = extractelement <4 x i64> %vecreg, i32 3
; Consume lanes 0 and 3: the comparison result picks which one is returned,
; so all four extracted values feed the function's return value.
%val = select i1 %cond, i64 %t0 , i64 %t3
ret i64 %val
}
|