forked from OSchip/llvm-project
AMDGPU: Run SIInsertWaits as pre-emit pass
Running this pass after the scheduler allows the waits to be placed later, so other ALU instructions can run in the time that would otherwise be spent waiting. When combined with enabling the post-RA scheduler, this gives a ~20% improvement on sgemm. llvm-svn: 241473
This commit is contained in:
parent
f423f5627c
commit
db7781c6e9
|
@ -280,10 +280,10 @@ void GCNPassConfig::addPostRegAlloc() {
|
|||
}
|
||||
|
||||
void GCNPassConfig::addPreSched2() {
|
||||
addPass(createSIInsertWaits(*TM), false);
|
||||
}
|
||||
|
||||
void GCNPassConfig::addPreEmitPass() {
|
||||
addPass(createSIInsertWaits(*TM), false);
|
||||
addPass(createSILowerControlFlowPass(*TM), false);
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in New Issue