forked from OSchip/llvm-project
[NFC][X86] Refine code in X86AsmBackend
Summary: Move code to a better place, rename function, etc Tags: #llvm Differential Revision: https://reviews.llvm.org/D77778
This commit is contained in:
parent
9aa5fbb3af
commit
2477cec2ac
|
@ -62,10 +62,9 @@ public:
|
|||
else if (BranchType == "indirect")
|
||||
addKind(X86::AlignBranchIndirect);
|
||||
else {
|
||||
report_fatal_error(
|
||||
"'-x86-align-branch 'The branches's type is combination of jcc, "
|
||||
"fused, jmp, call, ret, indirect.(plus separated)",
|
||||
false);
|
||||
errs() << "invalid argument " << BranchType.str()
|
||||
<< " to -x86-align-branch=; each element must be one of: fused, "
|
||||
"jcc, jmp, call, ret, indirect.(plus separated)";
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -129,18 +128,18 @@ class X86AsmBackend : public MCAsmBackend {
|
|||
std::unique_ptr<const MCInstrInfo> MCII;
|
||||
X86AlignBranchKind AlignBranchType;
|
||||
Align AlignBoundary;
|
||||
unsigned TargetPrefixMax = 0;
|
||||
|
||||
MCInst PrevInst;
|
||||
MCBoundaryAlignFragment *PendingBA = nullptr;
|
||||
std::pair<MCFragment *, size_t> PrevInstPosition;
|
||||
bool CanPadInst;
|
||||
|
||||
uint8_t determinePaddingPrefix(const MCInst &Inst) const;
|
||||
|
||||
bool isMacroFused(const MCInst &Cmp, const MCInst &Jcc) const;
|
||||
|
||||
bool needAlign(MCObjectStreamer &OS) const;
|
||||
bool needAlignInst(const MCInst &Inst) const;
|
||||
bool allowAutoPaddingForInst(const MCInst &Inst, MCObjectStreamer &OS) const;
|
||||
MCInst PrevInst;
|
||||
MCBoundaryAlignFragment *PendingBoundaryAlign = nullptr;
|
||||
std::pair<MCFragment *, size_t> PrevInstPosition;
|
||||
bool AllowAutoPaddingForInst;
|
||||
bool needAlign(const MCInst &Inst) const;
|
||||
bool canPadBranches(MCObjectStreamer &OS) const;
|
||||
bool canPadInst(const MCInst &Inst, MCObjectStreamer &OS) const;
|
||||
|
||||
public:
|
||||
X86AsmBackend(const Target &T, const MCSubtargetInfo &STI)
|
||||
|
@ -161,6 +160,8 @@ public:
|
|||
AlignBoundary = assumeAligned(X86AlignBranchBoundary);
|
||||
if (X86AlignBranch.getNumOccurrences())
|
||||
AlignBranchType = X86AlignBranchKindLoc;
|
||||
if (X86PadMaxPrefixSize.getNumOccurrences())
|
||||
TargetPrefixMax = X86PadMaxPrefixSize;
|
||||
}
|
||||
|
||||
bool allowAutoPadding() const override;
|
||||
|
@ -459,23 +460,7 @@ bool X86AsmBackend::allowAutoPadding() const {
|
|||
}
|
||||
|
||||
bool X86AsmBackend::allowEnhancedRelaxation() const {
|
||||
return allowAutoPadding() && X86PadMaxPrefixSize != 0 && X86PadForBranchAlign;
|
||||
}
|
||||
|
||||
bool X86AsmBackend::needAlign(MCObjectStreamer &OS) const {
|
||||
if (!OS.getAllowAutoPadding())
|
||||
return false;
|
||||
assert(allowAutoPadding() && "incorrect initialization!");
|
||||
|
||||
// To be Done: Currently don't deal with Bundle cases.
|
||||
if (OS.getAssembler().isBundlingEnabled())
|
||||
return false;
|
||||
|
||||
// Branches only need to be aligned in 32-bit or 64-bit mode.
|
||||
if (!(STI.hasFeature(X86::Mode64Bit) || STI.hasFeature(X86::Mode32Bit)))
|
||||
return false;
|
||||
|
||||
return true;
|
||||
return allowAutoPadding() && TargetPrefixMax != 0 && X86PadForBranchAlign;
|
||||
}
|
||||
|
||||
/// X86 has certain instructions which enable interrupts exactly one
|
||||
|
@ -545,25 +530,9 @@ static size_t getSizeForInstFragment(const MCFragment *F) {
|
|||
}
|
||||
}
|
||||
|
||||
/// Check if the instruction operand needs to be aligned.
|
||||
bool X86AsmBackend::needAlignInst(const MCInst &Inst) const {
|
||||
const MCInstrDesc &InstDesc = MCII->get(Inst.getOpcode());
|
||||
return (InstDesc.isConditionalBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchJcc)) ||
|
||||
(InstDesc.isUnconditionalBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchJmp)) ||
|
||||
(InstDesc.isCall() &&
|
||||
(AlignBranchType & X86::AlignBranchCall)) ||
|
||||
(InstDesc.isReturn() &&
|
||||
(AlignBranchType & X86::AlignBranchRet)) ||
|
||||
(InstDesc.isIndirectBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchIndirect));
|
||||
}
|
||||
|
||||
/// Return true if we can insert NOP or prefixes automatically before the
|
||||
/// the instruction to be emitted.
|
||||
bool X86AsmBackend::allowAutoPaddingForInst(const MCInst &Inst,
|
||||
MCObjectStreamer &OS) const {
|
||||
bool X86AsmBackend::canPadInst(const MCInst &Inst, MCObjectStreamer &OS) const {
|
||||
if (hasVariantSymbol(Inst))
|
||||
// Linker may rewrite the instruction with variant symbol operand(e.g.
|
||||
// TLSCALL).
|
||||
|
@ -592,23 +561,51 @@ bool X86AsmBackend::allowAutoPaddingForInst(const MCInst &Inst,
|
|||
return true;
|
||||
}
|
||||
|
||||
bool X86AsmBackend::canPadBranches(MCObjectStreamer &OS) const {
|
||||
if (!OS.getAllowAutoPadding())
|
||||
return false;
|
||||
assert(allowAutoPadding() && "incorrect initialization!");
|
||||
|
||||
// To be Done: Currently don't deal with Bundle cases.
|
||||
if (OS.getAssembler().isBundlingEnabled())
|
||||
return false;
|
||||
|
||||
// Branches only need to be aligned in 32-bit or 64-bit mode.
|
||||
if (!(STI.hasFeature(X86::Mode64Bit) || STI.hasFeature(X86::Mode32Bit)))
|
||||
return false;
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
/// Check if the instruction operand needs to be aligned.
|
||||
bool X86AsmBackend::needAlign(const MCInst &Inst) const {
|
||||
const MCInstrDesc &Desc = MCII->get(Inst.getOpcode());
|
||||
return (Desc.isConditionalBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchJcc)) ||
|
||||
(Desc.isUnconditionalBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchJmp)) ||
|
||||
(Desc.isCall() && (AlignBranchType & X86::AlignBranchCall)) ||
|
||||
(Desc.isReturn() && (AlignBranchType & X86::AlignBranchRet)) ||
|
||||
(Desc.isIndirectBranch() &&
|
||||
(AlignBranchType & X86::AlignBranchIndirect));
|
||||
}
|
||||
|
||||
/// Insert BoundaryAlignFragment before instructions to align branches.
|
||||
void X86AsmBackend::emitInstructionBegin(MCObjectStreamer &OS,
|
||||
const MCInst &Inst) {
|
||||
AllowAutoPaddingForInst = allowAutoPaddingForInst(Inst, OS);
|
||||
CanPadInst = canPadInst(Inst, OS);
|
||||
|
||||
if (!needAlign(OS))
|
||||
if (!canPadBranches(OS))
|
||||
return;
|
||||
|
||||
if (!isMacroFused(PrevInst, Inst))
|
||||
// Macro fusion doesn't happen indeed, clear the pending.
|
||||
PendingBoundaryAlign = nullptr;
|
||||
PendingBA = nullptr;
|
||||
|
||||
if (!AllowAutoPaddingForInst)
|
||||
if (!CanPadInst)
|
||||
return;
|
||||
|
||||
if (PendingBoundaryAlign &&
|
||||
OS.getCurrentFragment()->getPrevNode() == PendingBoundaryAlign) {
|
||||
if (PendingBA && OS.getCurrentFragment()->getPrevNode() == PendingBA) {
|
||||
// Macro fusion actually happens and there is no other fragment inserted
|
||||
// after the previous instruction.
|
||||
//
|
||||
|
@ -630,12 +627,11 @@ void X86AsmBackend::emitInstructionBegin(MCObjectStreamer &OS,
|
|||
return;
|
||||
}
|
||||
|
||||
if (needAlignInst(Inst) || ((AlignBranchType & X86::AlignBranchFused) &&
|
||||
isFirstMacroFusibleInst(Inst, *MCII))) {
|
||||
if (needAlign(Inst) || ((AlignBranchType & X86::AlignBranchFused) &&
|
||||
isFirstMacroFusibleInst(Inst, *MCII))) {
|
||||
// If we meet a unfused branch or the first instuction in a fusiable pair,
|
||||
// insert a BoundaryAlign fragment.
|
||||
OS.insert(PendingBoundaryAlign =
|
||||
new MCBoundaryAlignFragment(AlignBoundary));
|
||||
OS.insert(PendingBA = new MCBoundaryAlignFragment(AlignBoundary));
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -645,17 +641,17 @@ void X86AsmBackend::emitInstructionEnd(MCObjectStreamer &OS, const MCInst &Inst)
|
|||
MCFragment *CF = OS.getCurrentFragment();
|
||||
PrevInstPosition = std::make_pair(CF, getSizeForInstFragment(CF));
|
||||
if (auto *F = dyn_cast_or_null<MCRelaxableFragment>(CF))
|
||||
F->setAllowAutoPadding(AllowAutoPaddingForInst);
|
||||
F->setAllowAutoPadding(CanPadInst);
|
||||
|
||||
if (!needAlign(OS))
|
||||
if (!canPadBranches(OS))
|
||||
return;
|
||||
|
||||
if (!needAlignInst(Inst) || !PendingBoundaryAlign)
|
||||
if (!needAlign(Inst) || !PendingBA)
|
||||
return;
|
||||
|
||||
// Tie the aligned instructions into a a pending BoundaryAlign.
|
||||
PendingBoundaryAlign->setLastFragment(CF);
|
||||
PendingBoundaryAlign = nullptr;
|
||||
PendingBA->setLastFragment(CF);
|
||||
PendingBA = nullptr;
|
||||
|
||||
// We need to ensure that further data isn't added to the current
|
||||
// DataFragment, so that we can get the size of instructions later in
|
||||
|
@ -853,26 +849,6 @@ static bool isFullyRelaxed(const MCRelaxableFragment &RF) {
|
|||
return getRelaxedOpcode(Inst, Is16BitMode) == Inst.getOpcode();
|
||||
}
|
||||
|
||||
static unsigned getRemainingPrefixSize(const MCInst &Inst,
|
||||
const MCSubtargetInfo &STI,
|
||||
MCCodeEmitter &Emitter) {
|
||||
SmallString<256> Code;
|
||||
raw_svector_ostream VecOS(Code);
|
||||
Emitter.emitPrefix(Inst, VecOS, STI);
|
||||
assert(Code.size() < 15 && "The number of prefixes must be less than 15.");
|
||||
|
||||
// TODO: It turns out we need a decent amount of plumbing for the target
|
||||
// specific bits to determine number of prefixes its safe to add. Various
|
||||
// targets (older chips mostly, but also Atom family) encounter decoder
|
||||
// stalls with too many prefixes. For testing purposes, we set the value
|
||||
// externally for the moment.
|
||||
unsigned ExistingPrefixSize = Code.size();
|
||||
unsigned TargetPrefixMax = X86PadMaxPrefixSize;
|
||||
if (TargetPrefixMax <= ExistingPrefixSize)
|
||||
return 0;
|
||||
return TargetPrefixMax - ExistingPrefixSize;
|
||||
}
|
||||
|
||||
bool X86AsmBackend::padInstructionViaPrefix(MCRelaxableFragment &RF,
|
||||
MCCodeEmitter &Emitter,
|
||||
unsigned &RemainingSize) const {
|
||||
|
@ -890,9 +866,24 @@ bool X86AsmBackend::padInstructionViaPrefix(MCRelaxableFragment &RF,
|
|||
return false;
|
||||
|
||||
const unsigned MaxPossiblePad = std::min(15 - OldSize, RemainingSize);
|
||||
const unsigned RemainingPrefixSize = [&]() -> unsigned {
|
||||
SmallString<15> Code;
|
||||
raw_svector_ostream VecOS(Code);
|
||||
Emitter.emitPrefix(RF.getInst(), VecOS, STI);
|
||||
assert(Code.size() < 15 && "The number of prefixes must be less than 15.");
|
||||
|
||||
// TODO: It turns out we need a decent amount of plumbing for the target
|
||||
// specific bits to determine number of prefixes its safe to add. Various
|
||||
// targets (older chips mostly, but also Atom family) encounter decoder
|
||||
// stalls with too many prefixes. For testing purposes, we set the value
|
||||
// externally for the moment.
|
||||
unsigned ExistingPrefixSize = Code.size();
|
||||
if (TargetPrefixMax <= ExistingPrefixSize)
|
||||
return 0;
|
||||
return TargetPrefixMax - ExistingPrefixSize;
|
||||
}();
|
||||
const unsigned PrefixBytesToAdd =
|
||||
std::min(MaxPossiblePad,
|
||||
getRemainingPrefixSize(RF.getInst(), STI, Emitter));
|
||||
std::min(MaxPossiblePad, RemainingPrefixSize);
|
||||
if (PrefixBytesToAdd == 0)
|
||||
return false;
|
||||
|
||||
|
|
Loading…
Reference in New Issue