forked from OSchip/llvm-project
Use a latency value of 0 for the artificial edges inserted by
AddPseudoTwoAddrDeps. This lets the scheduling infrastructure avoid recalculating node heights. In very large testcases this was a major bottleneck. Thanks to Roman Levenstein for finding this! As a side effect, fold-pcmpeqd-0.ll is now scheduled better and it no longer requires spilling on x86-32. llvm-svn: 61778
This commit is contained in:
parent
04a2079726
commit
79c3516912
|
@@ -1252,7 +1252,7 @@ void RegReductionPriorityQueue<SF>::AddPseudoTwoAddrDeps() {
|
|||
!scheduleDAG->IsReachable(SuccSU, SU)) {
|
||||
DOUT << "Adding a pseudo-two-addr edge from SU # " << SU->NodeNum
|
||||
<< " to SU #" << SuccSU->NodeNum << "\n";
|
||||
-scheduleDAG->AddPred(SU, SDep(SuccSU, SDep::Order, /*Latency=*/1,
|
||||
+scheduleDAG->AddPred(SU, SDep(SuccSU, SDep::Order, /*Latency=*/0,
|
||||
/*Reg=*/0, /*isMustAlias=*/false,
|
||||
/*isArtificial=*/true));
|
||||
}
|
||||
|
|
|
@@ -1,4 +1,4 @@
|
|||
-; RUN: llvm-as < %s | llc -mtriple=i386-apple-darwin | not grep pcmpeqd
|
||||
+; RUN: llvm-as < %s | llc -mtriple=i386-apple-darwin | grep pcmpeqd | count 1
|
||||
; RUN: llvm-as < %s | llc -mtriple=x86_64-apple-darwin | grep pcmpeqd | count 1
|
||||
|
||||
; This testcase shouldn't need to spill the -1 value,
|
||||
|
|
Loading…
Reference in New Issue