forked from OSchip/llvm-project
439 lines
13 KiB
C++
439 lines
13 KiB
C++
//===-- Thumb2ITBlockPass.cpp - Insert Thumb-2 IT blocks ------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "ARM.h"
|
|
#include "ARMMachineFunctionInfo.h"
|
|
#include "ARMSubtarget.h"
|
|
#include "MCTargetDesc/ARMBaseInfo.h"
|
|
#include "Thumb2InstrInfo.h"
|
|
#include "llvm/ADT/SmallSet.h"
|
|
#include "llvm/ADT/SmallVector.h"
|
|
#include "llvm/ADT/Statistic.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/CodeGen/MachineBasicBlock.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/CodeGen/MachineFunctionPass.h"
|
|
#include "llvm/CodeGen/MachineInstr.h"
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
|
#include "llvm/CodeGen/MachineInstrBundle.h"
|
|
#include "llvm/CodeGen/MachineOperand.h"
|
|
#include "llvm/IR/DebugLoc.h"
|
|
#include "llvm/MC/MCInstrDesc.h"
|
|
#include "llvm/MC/MCRegisterInfo.h"
|
|
#include <cassert>
|
|
#include <new>
|
|
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "thumb2-it"
|
|
#define PASS_NAME "Thumb IT blocks insertion pass"
|
|
|
|
STATISTIC(NumITs, "Number of IT blocks inserted");
|
|
STATISTIC(NumMovedInsts, "Number of predicated instructions moved");
|
|
|
|
using RegisterSet = SmallSet<unsigned, 4>;
|
|
|
|
namespace {
|
|
|
|
class Thumb2ITBlock : public MachineFunctionPass {
|
|
public:
|
|
static char ID;
|
|
|
|
bool restrictIT;
|
|
const Thumb2InstrInfo *TII;
|
|
const TargetRegisterInfo *TRI;
|
|
ARMFunctionInfo *AFI;
|
|
|
|
Thumb2ITBlock() : MachineFunctionPass(ID) {}
|
|
|
|
bool runOnMachineFunction(MachineFunction &Fn) override;
|
|
|
|
MachineFunctionProperties getRequiredProperties() const override {
|
|
return MachineFunctionProperties().set(
|
|
MachineFunctionProperties::Property::NoVRegs);
|
|
}
|
|
|
|
StringRef getPassName() const override {
|
|
return PASS_NAME;
|
|
}
|
|
|
|
private:
|
|
bool MoveCopyOutOfITBlock(MachineInstr *MI,
|
|
ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
|
|
RegisterSet &Defs, RegisterSet &Uses);
|
|
bool InsertITInstructions(MachineBasicBlock &Block);
|
|
};
|
|
|
|
char Thumb2ITBlock::ID = 0;
|
|
|
|
} // end anonymous namespace
|
|
|
|
INITIALIZE_PASS(Thumb2ITBlock, DEBUG_TYPE, PASS_NAME, false, false)
|
|
|
|
/// TrackDefUses - Tracking what registers are being defined and used by
|
|
/// instructions in the IT block. This also tracks "dependencies", i.e. uses
|
|
/// in the IT block that are defined before the IT instruction.
|
|
static void TrackDefUses(MachineInstr *MI, RegisterSet &Defs, RegisterSet &Uses,
|
|
const TargetRegisterInfo *TRI) {
|
|
using RegList = SmallVector<unsigned, 4>;
|
|
RegList LocalDefs;
|
|
RegList LocalUses;
|
|
|
|
for (auto &MO : MI->operands()) {
|
|
if (!MO.isReg())
|
|
continue;
|
|
unsigned Reg = MO.getReg();
|
|
if (!Reg || Reg == ARM::ITSTATE || Reg == ARM::SP)
|
|
continue;
|
|
if (MO.isUse())
|
|
LocalUses.push_back(Reg);
|
|
else
|
|
LocalDefs.push_back(Reg);
|
|
}
|
|
|
|
auto InsertUsesDefs = [&](RegList &Regs, RegisterSet &UsesDefs) {
|
|
for (unsigned Reg : Regs)
|
|
for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
|
|
Subreg.isValid(); ++Subreg)
|
|
UsesDefs.insert(*Subreg);
|
|
};
|
|
|
|
InsertUsesDefs(LocalDefs, Defs);
|
|
InsertUsesDefs(LocalUses, Uses);
|
|
}
|
|
|
|
/// Clear kill flags for any uses in the given set. This will likely
|
|
/// conservatively remove more kill flags than are necessary, but removing them
|
|
/// is safer than incorrect kill flags remaining on instructions.
|
|
static void ClearKillFlags(MachineInstr *MI, RegisterSet &Uses) {
|
|
for (MachineOperand &MO : MI->operands()) {
|
|
if (!MO.isReg() || MO.isDef() || !MO.isKill())
|
|
continue;
|
|
if (!Uses.count(MO.getReg()))
|
|
continue;
|
|
MO.setIsKill(false);
|
|
}
|
|
}
|
|
|
|
static bool isCopy(MachineInstr *MI) {
|
|
switch (MI->getOpcode()) {
|
|
default:
|
|
return false;
|
|
case ARM::MOVr:
|
|
case ARM::MOVr_TC:
|
|
case ARM::tMOVr:
|
|
case ARM::t2MOVr:
|
|
return true;
|
|
}
|
|
}
|
|
|
|
bool
|
|
Thumb2ITBlock::MoveCopyOutOfITBlock(MachineInstr *MI,
|
|
ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
|
|
RegisterSet &Defs, RegisterSet &Uses) {
|
|
if (!isCopy(MI))
|
|
return false;
|
|
// llvm models select's as two-address instructions. That means a copy
|
|
// is inserted before a t2MOVccr, etc. If the copy is scheduled in
|
|
// between selects we would end up creating multiple IT blocks.
|
|
assert(MI->getOperand(0).getSubReg() == 0 &&
|
|
MI->getOperand(1).getSubReg() == 0 &&
|
|
"Sub-register indices still around?");
|
|
|
|
unsigned DstReg = MI->getOperand(0).getReg();
|
|
unsigned SrcReg = MI->getOperand(1).getReg();
|
|
|
|
// First check if it's safe to move it.
|
|
if (Uses.count(DstReg) || Defs.count(SrcReg))
|
|
return false;
|
|
|
|
// If the CPSR is defined by this copy, then we don't want to move it. E.g.,
|
|
// if we have:
|
|
//
|
|
// movs r1, r1
|
|
// rsb r1, 0
|
|
// movs r2, r2
|
|
// rsb r2, 0
|
|
//
|
|
// we don't want this to be converted to:
|
|
//
|
|
// movs r1, r1
|
|
// movs r2, r2
|
|
// itt mi
|
|
// rsb r1, 0
|
|
// rsb r2, 0
|
|
//
|
|
const MCInstrDesc &MCID = MI->getDesc();
|
|
if (MI->hasOptionalDef() &&
|
|
MI->getOperand(MCID.getNumOperands() - 1).getReg() == ARM::CPSR)
|
|
return false;
|
|
|
|
// Then peek at the next instruction to see if it's predicated on CC or OCC.
|
|
// If not, then there is nothing to be gained by moving the copy.
|
|
MachineBasicBlock::iterator I = MI;
|
|
++I;
|
|
MachineBasicBlock::iterator E = MI->getParent()->end();
|
|
|
|
while (I != E && I->isDebugInstr())
|
|
++I;
|
|
|
|
if (I != E) {
|
|
unsigned NPredReg = 0;
|
|
ARMCC::CondCodes NCC = getITInstrPredicate(*I, NPredReg);
|
|
if (NCC == CC || NCC == OCC)
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
bool Thumb2ITBlock::InsertITInstructions(MachineBasicBlock &MBB) {
|
|
bool Modified = false;
|
|
RegisterSet Defs, Uses;
|
|
MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end();
|
|
|
|
while (MBBI != E) {
|
|
MachineInstr *MI = &*MBBI;
|
|
DebugLoc dl = MI->getDebugLoc();
|
|
unsigned PredReg = 0;
|
|
ARMCC::CondCodes CC = getITInstrPredicate(*MI, PredReg);
|
|
if (CC == ARMCC::AL) {
|
|
++MBBI;
|
|
continue;
|
|
}
|
|
|
|
Defs.clear();
|
|
Uses.clear();
|
|
TrackDefUses(MI, Defs, Uses, TRI);
|
|
|
|
// Insert an IT instruction.
|
|
MachineInstrBuilder MIB = BuildMI(MBB, MBBI, dl, TII->get(ARM::t2IT))
|
|
.addImm(CC);
|
|
|
|
// Add implicit use of ITSTATE to IT block instructions.
|
|
MI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
|
|
true/*isImp*/, false/*isKill*/));
|
|
|
|
MachineInstr *LastITMI = MI;
|
|
MachineBasicBlock::iterator InsertPos = MIB.getInstr();
|
|
++MBBI;
|
|
|
|
// Form IT block.
|
|
ARMCC::CondCodes OCC = ARMCC::getOppositeCondition(CC);
|
|
unsigned Mask = 0, Pos = 3;
|
|
|
|
// v8 IT blocks are limited to one conditional op unless -arm-no-restrict-it
|
|
// is set: skip the loop
|
|
if (!restrictIT) {
|
|
// Branches, including tricky ones like LDM_RET, need to end an IT
|
|
// block so check the instruction we just put in the block.
|
|
for (; MBBI != E && Pos &&
|
|
(!MI->isBranch() && !MI->isReturn()) ; ++MBBI) {
|
|
if (MBBI->isDebugInstr())
|
|
continue;
|
|
|
|
MachineInstr *NMI = &*MBBI;
|
|
MI = NMI;
|
|
|
|
unsigned NPredReg = 0;
|
|
ARMCC::CondCodes NCC = getITInstrPredicate(*NMI, NPredReg);
|
|
if (NCC == CC || NCC == OCC) {
|
|
Mask |= ((NCC ^ CC) & 1) << Pos;
|
|
// Add implicit use of ITSTATE.
|
|
NMI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
|
|
true/*isImp*/, false/*isKill*/));
|
|
LastITMI = NMI;
|
|
} else {
|
|
if (NCC == ARMCC::AL &&
|
|
MoveCopyOutOfITBlock(NMI, CC, OCC, Defs, Uses)) {
|
|
--MBBI;
|
|
MBB.remove(NMI);
|
|
MBB.insert(InsertPos, NMI);
|
|
ClearKillFlags(MI, Uses);
|
|
++NumMovedInsts;
|
|
continue;
|
|
}
|
|
break;
|
|
}
|
|
TrackDefUses(NMI, Defs, Uses, TRI);
|
|
--Pos;
|
|
}
|
|
}
|
|
|
|
// Finalize IT mask.
|
|
Mask |= (1 << Pos);
|
|
MIB.addImm(Mask);
|
|
|
|
// Last instruction in IT block kills ITSTATE.
|
|
LastITMI->findRegisterUseOperand(ARM::ITSTATE)->setIsKill();
|
|
|
|
// Finalize the bundle.
|
|
finalizeBundle(MBB, InsertPos.getInstrIterator(),
|
|
++LastITMI->getIterator());
|
|
|
|
Modified = true;
|
|
++NumITs;
|
|
}
|
|
|
|
return Modified;
|
|
}
|
|
|
|
bool Thumb2ITBlock::runOnMachineFunction(MachineFunction &Fn) {
|
|
const ARMSubtarget &STI =
|
|
static_cast<const ARMSubtarget &>(Fn.getSubtarget());
|
|
if (!STI.isThumb2())
|
|
return false;
|
|
AFI = Fn.getInfo<ARMFunctionInfo>();
|
|
TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo());
|
|
TRI = STI.getRegisterInfo();
|
|
restrictIT = STI.restrictIT();
|
|
|
|
if (!AFI->isThumbFunction())
|
|
return false;
|
|
|
|
bool Modified = false;
|
|
for (auto &MBB : Fn )
|
|
Modified |= InsertITInstructions(MBB);
|
|
|
|
if (Modified)
|
|
AFI->setHasITBlocks(true);
|
|
|
|
return Modified;
|
|
}
|
|
|
|
/// createThumb2ITBlockPass - Returns an instance of the Thumb2 IT blocks
|
|
/// insertion pass.
|
|
FunctionPass *llvm::createThumb2ITBlockPass() { return new Thumb2ITBlock(); }
|
|
|
|
#undef DEBUG_TYPE
|
|
#define DEBUG_TYPE "arm-mve-vpt"
|
|
|
|
namespace {
|
|
class MVEVPTBlock : public MachineFunctionPass {
|
|
public:
|
|
static char ID;
|
|
const Thumb2InstrInfo *TII;
|
|
const TargetRegisterInfo *TRI;
|
|
|
|
MVEVPTBlock() : MachineFunctionPass(ID) {}
|
|
|
|
bool runOnMachineFunction(MachineFunction &Fn) override;
|
|
|
|
MachineFunctionProperties getRequiredProperties() const override {
|
|
return MachineFunctionProperties().set(
|
|
MachineFunctionProperties::Property::NoVRegs);
|
|
}
|
|
|
|
StringRef getPassName() const override {
|
|
return "MVE VPT block insertion pass";
|
|
}
|
|
|
|
private:
|
|
bool InsertVPTBlocks(MachineBasicBlock &MBB);
|
|
};
|
|
|
|
char MVEVPTBlock::ID = 0;
|
|
|
|
} // end anonymous namespace
|
|
|
|
INITIALIZE_PASS(MVEVPTBlock, DEBUG_TYPE, "ARM MVE VPT block pass", false, false)
|
|
|
|
enum VPTMaskValue {
|
|
T = 8, // 0b1000
|
|
TT = 4, // 0b0100
|
|
TE = 12, // 0b1100
|
|
TTT = 2, // 0b0010
|
|
TTE = 6, // 0b0110
|
|
TEE = 10, // 0b1010
|
|
TET = 14, // 0b1110
|
|
TTTT = 1, // 0b0001
|
|
TTTE = 3, // 0b0011
|
|
TTEE = 5, // 0b0101
|
|
TTET = 7, // 0b0111
|
|
TEEE = 9, // 0b1001
|
|
TEET = 11, // 0b1011
|
|
TETT = 13, // 0b1101
|
|
TETE = 15 // 0b1111
|
|
};
|
|
|
|
bool MVEVPTBlock::InsertVPTBlocks(MachineBasicBlock &Block) {
|
|
bool Modified = false;
|
|
MachineBasicBlock::iterator MBIter = Block.begin();
|
|
MachineBasicBlock::iterator EndIter = Block.end();
|
|
|
|
while (MBIter != EndIter) {
|
|
MachineInstr *MI = &*MBIter;
|
|
unsigned PredReg = 0;
|
|
DebugLoc dl = MI->getDebugLoc();
|
|
|
|
ARMVCC::VPTCodes Pred = getVPTInstrPredicate(*MI, PredReg);
|
|
|
|
// The idea of the predicate is that None, Then and Else are for use when
|
|
// handling assembly language: they correspond to the three possible
|
|
// suffixes "", "t" and "e" on the mnemonic. So when instructions are read
|
|
// from assembly source or disassembled from object code, you expect to see
|
|
// a mixture whenever there's a long VPT block. But in code generation, we
|
|
// hope we'll never generate an Else as input to this pass.
|
|
|
|
assert(Pred != ARMVCC::Else && "VPT block pass does not expect Else preds");
|
|
|
|
if (Pred == ARMVCC::None) {
|
|
++MBIter;
|
|
continue;
|
|
}
|
|
|
|
MachineInstrBuilder MIBuilder =
|
|
BuildMI(Block, MBIter, dl, TII->get(ARM::MVE_VPST));
|
|
// The mask value for the VPST instruction is T = 0b1000 = 8
|
|
MIBuilder.addImm(VPTMaskValue::T);
|
|
|
|
MachineBasicBlock::iterator VPSTInsertPos = MIBuilder.getInstr();
|
|
int VPTInstCnt = 1;
|
|
ARMVCC::VPTCodes NextPred;
|
|
|
|
do {
|
|
++MBIter;
|
|
NextPred = getVPTInstrPredicate(*MBIter, PredReg);
|
|
} while (NextPred != ARMVCC::None && NextPred == Pred && ++VPTInstCnt < 4);
|
|
|
|
MachineInstr *LastMI = &*MBIter;
|
|
finalizeBundle(Block, VPSTInsertPos.getInstrIterator(),
|
|
++LastMI->getIterator());
|
|
|
|
Modified = true;
|
|
LLVM_DEBUG(dbgs() << "VPT block created for: "; MI->dump(););
|
|
|
|
++MBIter;
|
|
}
|
|
return Modified;
|
|
}
|
|
|
|
bool MVEVPTBlock::runOnMachineFunction(MachineFunction &Fn) {
|
|
const ARMSubtarget &STI =
|
|
static_cast<const ARMSubtarget &>(Fn.getSubtarget());
|
|
|
|
if (!STI.isThumb2() || !STI.hasMVEIntegerOps())
|
|
return false;
|
|
|
|
TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo());
|
|
TRI = STI.getRegisterInfo();
|
|
|
|
LLVM_DEBUG(dbgs() << "********** ARM MVE VPT BLOCKS **********\n"
|
|
<< "********** Function: " << Fn.getName() << '\n');
|
|
|
|
bool Modified = false;
|
|
for (MachineBasicBlock &MBB : Fn)
|
|
Modified |= InsertVPTBlocks(MBB);
|
|
|
|
LLVM_DEBUG(dbgs() << "**************************************\n");
|
|
return Modified;
|
|
}
|
|
|
|
/// createMVEVPTBlock - Returns an instance of the MVE VPT block
|
|
/// insertion pass.
|
|
FunctionPass *llvm::createMVEVPTBlockPass() { return new MVEVPTBlock(); }
|