forked from OSchip/llvm-project
[AArch64] Reduce vector insert/extract cost for Kryo
Differential Revision: http://reviews.llvm.org/D17379
llvm-svn: 261237
This commit is contained in:
parent
7c8e2c37ba
commit
921ad01a1d
|
@@ -313,6 +313,8 @@ int AArch64TTIImpl::getVectorInstrCost(unsigned Opcode, Type *Val,
|
|||
}
|
||||
|
||||
// All other insert/extracts cost this much.
|
||||
if (ST->isKryo())
|
||||
return 2;
|
||||
return 3;
|
||||
}
|
||||
|
||||
|
|
|
@@ -0,0 +1,26 @@
|
|||
; RUN: opt < %s -cost-model -analyze -mcpu=kryo | FileCheck %s
|
||||
|
||||
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
|
||||
target triple = "aarch64--linux-gnu"
|
||||
|
||||
; CHECK-LABEL: vectorInstrCost
|
||||
; Test body for the vector insert/extract cost queries: it contains one
; extractelement and one insertelement at lane 0 and at lane 1 of a <2 x i64>
; vector. Every operand is undef and the results %t1-%t4 are never used; the
; instructions exist only so the cost model prints a cost for each of them,
; which the FileCheck directives inside the body then match.
define void @vectorInstrCost() {
|
||||
|
||||
; Vector extracts - extracting the first element should have a zero cost;
|
||||
; all other elements should have a cost of two.
|
||||
;
|
||||
; CHECK: cost of 0 {{.*}} extractelement <2 x i64> undef, i32 0
|
||||
; CHECK: cost of 2 {{.*}} extractelement <2 x i64> undef, i32 1
|
||||
%t1 = extractelement <2 x i64> undef, i32 0
|
||||
%t2 = extractelement <2 x i64> undef, i32 1
|
||||
|
||||
; Vector inserts - inserting the first element should have a zero cost; all
|
||||
; other elements should have a cost of two.
|
||||
;
|
||||
; CHECK: cost of 0 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 0
|
||||
; CHECK: cost of 2 {{.*}} insertelement <2 x i64> undef, i64 undef, i32 1
|
||||
%t3 = insertelement <2 x i64> undef, i64 undef, i32 0
|
||||
%t4 = insertelement <2 x i64> undef, i64 undef, i32 1
|
||||
|
||||
; Nothing is returned; the function has no observable result of its own.
ret void
|
||||
}
|
Loading…
Reference in New Issue