Use a latency value of 0 for the artificial edges inserted by AddPseudoTwoAddrDeps.

This lets the scheduling infrastructure avoid recalculating node heights. In very large testcases, that recalculation was a major bottleneck. Thanks to Roman Levenstein for finding this!

As a side effect, fold-pcmpeqd-0.ll is now scheduled better and no longer requires spilling on x86-32.

llvm-svn: 61778
2009-01-06 01:19:04 +00:00 · 2009-01-06 01:19:04 +00:00 · 79c3516912
parent 04a2079726
commit 79c3516912
2 changed files with 2 additions and 2 deletions
--- a/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGRRList.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGRRList.cpp
@@ -1252,7 +1252,7 @@ void RegReductionPriorityQueue<SF>::AddPseudoTwoAddrDeps() {
            !scheduleDAG->IsReachable(SuccSU, SU)) {
          DOUT << "Adding a pseudo-two-addr edge from SU # " << SU->NodeNum
               << " to SU #" << SuccSU->NodeNum << "\n";
-          scheduleDAG->AddPred(SU, SDep(SuccSU, SDep::Order, /*Latency=*/1,
+          scheduleDAG->AddPred(SU, SDep(SuccSU, SDep::Order, /*Latency=*/0,
                                        /*Reg=*/0, /*isMustAlias=*/false,
                                        /*isArtificial=*/true));
        }
--- a/llvm/test/CodeGen/X86/fold-pcmpeqd-0.ll
+++ b/llvm/test/CodeGen/X86/fold-pcmpeqd-0.ll
@@ -1,4 +1,4 @@
-; RUN: llvm-as < %s | llc -mtriple=i386-apple-darwin   | not grep pcmpeqd
+; RUN: llvm-as < %s | llc -mtriple=i386-apple-darwin   | grep pcmpeqd | count 1
 ; RUN: llvm-as < %s | llc -mtriple=x86_64-apple-darwin | grep pcmpeqd | count 1

 ; This testcase shouldn't need to spill the -1 value,