forked from OSchip/llvm-project
[AArch64] Allow loads with imp-def to be handled in getMemOpBaseRegImmOfsWidth()
Summary: This change will allow loads with imp-def to be clustered in machine-scheduler pass. areMemAccessesTriviallyDisjoint() can also handle loads with imp-def. Reviewers: mcrosier, jmolloy, t.p.northover Subscribers: aemerson, rengolin, mcrosier, llvm-commits Differential Revision: http://reviews.llvm.org/D18665 llvm-svn: 265051
This commit is contained in:
parent
9defda528e
commit
760afcb338
|
@ -1404,7 +1404,7 @@ bool AArch64InstrInfo::getMemOpBaseRegImmOfsWidth(
|
||||||
const TargetRegisterInfo *TRI) const {
|
const TargetRegisterInfo *TRI) const {
|
||||||
assert(LdSt->mayLoadOrStore() && "Expected a memory operation.");
|
assert(LdSt->mayLoadOrStore() && "Expected a memory operation.");
|
||||||
// Handle only loads/stores with base register followed by immediate offset.
|
// Handle only loads/stores with base register followed by immediate offset.
|
||||||
if (LdSt->getNumOperands() != 3)
|
if (LdSt->getNumExplicitOperands() != 3)
|
||||||
return false;
|
return false;
|
||||||
if (!LdSt->getOperand(1).isReg() || !LdSt->getOperand(2).isImm())
|
if (!LdSt->getOperand(1).isReg() || !LdSt->getOperand(2).isImm())
|
||||||
return false;
|
return false;
|
||||||
|
|
|
@ -125,7 +125,7 @@ entry:
|
||||||
define void @bar(i32 %x, <4 x i32> %y) nounwind {
|
define void @bar(i32 %x, <4 x i32> %y) nounwind {
|
||||||
entry:
|
entry:
|
||||||
; CHECK-LABEL: bar:
|
; CHECK-LABEL: bar:
|
||||||
; CHECK: str {{q[0-9]+}}, [sp, #16]
|
; CHECK: stp {{q[0-9]+}}, {{q[0-9]+}}, [sp, #16]
|
||||||
; CHECK: str {{x[0-9]+}}, [sp]
|
; CHECK: str {{x[0-9]+}}, [sp]
|
||||||
%x.addr = alloca i32, align 4
|
%x.addr = alloca i32, align 4
|
||||||
%y.addr = alloca <4 x i32>, align 16
|
%y.addr = alloca <4 x i32>, align 16
|
||||||
|
|
|
@ -0,0 +1,35 @@
|
||||||
|
# RUN: llc -mtriple=aarch64-none-linux-gnu -run-pass machine-scheduler -verify-machineinstrs -o /dev/null %s 2>&1 | FileCheck %s
|
||||||
|
|
||||||
|
--- |
|
||||||
|
define i64 @load_imp-def(i64* nocapture %P, i32 %v) {
|
||||||
|
entry:
|
||||||
|
%0 = bitcast i64* %P to i32*
|
||||||
|
%1 = load i32, i32* %0
|
||||||
|
%conv = zext i32 %1 to i64
|
||||||
|
%arrayidx19 = getelementptr inbounds i64, i64* %P, i64 1
|
||||||
|
%arrayidx1 = bitcast i64* %arrayidx19 to i32*
|
||||||
|
store i32 %v, i32* %arrayidx1
|
||||||
|
%2 = load i64, i64* %arrayidx19
|
||||||
|
%and = and i64 %2, 4294967295
|
||||||
|
%add = add nuw nsw i64 %and, %conv
|
||||||
|
ret i64 %add
|
||||||
|
}
|
||||||
|
...
|
||||||
|
---
|
||||||
|
# CHECK-LABEL: name: load_imp-def
|
||||||
|
# CHECK: bb.0.entry:
|
||||||
|
# CHECK: LDRWui %x0, 0
|
||||||
|
# CHECK: LDRWui %x0, 1
|
||||||
|
# CHECK: STRWui %w1, %x0, 2
|
||||||
|
name: load_imp-def
|
||||||
|
isSSA: true
|
||||||
|
body: |
|
||||||
|
bb.0.entry:
|
||||||
|
liveins: %w1, %x0
|
||||||
|
%w8 = LDRWui %x0, 1, implicit-def %x8 :: (load 4 from %ir.0)
|
||||||
|
STRWui killed %w1, %x0, 2 :: (store 4 into %ir.arrayidx1)
|
||||||
|
%w9 = LDRWui killed %x0, 0, implicit-def %x9 :: (load 4 from %ir.arrayidx19, align 8)
|
||||||
|
%x0 = ADDXrr killed %x9, killed %x8
|
||||||
|
RET_ReallyLR implicit %x0
|
||||||
|
...
|
||||||
|
|
Loading…
Reference in New Issue