else if (BranchType == "indirect")
addKind(X86::AlignBranchIndirect);
else {
- report_fatal_error(
- "'-x86-align-branch 'The branches's type is combination of jcc, "
- "fused, jmp, call, ret, indirect.(plus separated)",
- false);
+ errs() << "invalid argument " << BranchType.str()
+ << " to -x86-align-branch=; each element must be one of: fused, "
+ "jcc, jmp, call, ret, indirect.(plus separated)";
}
}
}
std::unique_ptr<const MCInstrInfo> MCII;
X86AlignBranchKind AlignBranchType;
Align AlignBoundary;
+ unsigned TargetPrefixMax = 0;
- uint8_t determinePaddingPrefix(const MCInst &Inst) const;
-
- bool isMacroFused(const MCInst &Cmp, const MCInst &Jcc) const;
-
- bool needAlign(MCObjectStreamer &OS) const;
- bool needAlignInst(const MCInst &Inst) const;
- bool allowAutoPaddingForInst(const MCInst &Inst, MCObjectStreamer &OS) const;
MCInst PrevInst;
- MCBoundaryAlignFragment *PendingBoundaryAlign = nullptr;
+ MCBoundaryAlignFragment *PendingBA = nullptr;
std::pair<MCFragment *, size_t> PrevInstPosition;
- bool AllowAutoPaddingForInst;
+ bool CanPadInst;
+
+ uint8_t determinePaddingPrefix(const MCInst &Inst) const;
+ bool isMacroFused(const MCInst &Cmp, const MCInst &Jcc) const;
+ bool needAlign(const MCInst &Inst) const;
+ bool canPadBranches(MCObjectStreamer &OS) const;
+ bool canPadInst(const MCInst &Inst, MCObjectStreamer &OS) const;
public:
X86AsmBackend(const Target &T, const MCSubtargetInfo &STI)
AlignBoundary = assumeAligned(X86AlignBranchBoundary);
if (X86AlignBranch.getNumOccurrences())
AlignBranchType = X86AlignBranchKindLoc;
+ if (X86PadMaxPrefixSize.getNumOccurrences())
+ TargetPrefixMax = X86PadMaxPrefixSize;
}
bool allowAutoPadding() const override;
}
bool X86AsmBackend::allowEnhancedRelaxation() const {
- return allowAutoPadding() && X86PadMaxPrefixSize != 0 && X86PadForBranchAlign;
-}
-
-bool X86AsmBackend::needAlign(MCObjectStreamer &OS) const {
- if (!OS.getAllowAutoPadding())
- return false;
- assert(allowAutoPadding() && "incorrect initialization!");
-
- // To be Done: Currently don't deal with Bundle cases.
- if (OS.getAssembler().isBundlingEnabled())
- return false;
-
- // Branches only need to be aligned in 32-bit or 64-bit mode.
- if (!(STI.hasFeature(X86::Mode64Bit) || STI.hasFeature(X86::Mode32Bit)))
- return false;
-
- return true;
+ return allowAutoPadding() && TargetPrefixMax != 0 && X86PadForBranchAlign;
}
/// X86 has certain instructions which enable interrupts exactly one
}
}
-/// Check if the instruction operand needs to be aligned.
-bool X86AsmBackend::needAlignInst(const MCInst &Inst) const {
- const MCInstrDesc &InstDesc = MCII->get(Inst.getOpcode());
- return (InstDesc.isConditionalBranch() &&
- (AlignBranchType & X86::AlignBranchJcc)) ||
- (InstDesc.isUnconditionalBranch() &&
- (AlignBranchType & X86::AlignBranchJmp)) ||
- (InstDesc.isCall() &&
- (AlignBranchType & X86::AlignBranchCall)) ||
- (InstDesc.isReturn() &&
- (AlignBranchType & X86::AlignBranchRet)) ||
- (InstDesc.isIndirectBranch() &&
- (AlignBranchType & X86::AlignBranchIndirect));
-}
-
/// Return true if we can insert NOP or prefixes automatically before the
/// the instruction to be emitted.
-bool X86AsmBackend::allowAutoPaddingForInst(const MCInst &Inst,
- MCObjectStreamer &OS) const {
+bool X86AsmBackend::canPadInst(const MCInst &Inst, MCObjectStreamer &OS) const {
if (hasVariantSymbol(Inst))
// Linker may rewrite the instruction with variant symbol operand(e.g.
// TLSCALL).
return true;
}
+bool X86AsmBackend::canPadBranches(MCObjectStreamer &OS) const {
+ if (!OS.getAllowAutoPadding())
+ return false;
+ assert(allowAutoPadding() && "incorrect initialization!");
+
+ // To be Done: Currently don't deal with Bundle cases.
+ if (OS.getAssembler().isBundlingEnabled())
+ return false;
+
+ // Branches only need to be aligned in 32-bit or 64-bit mode.
+ if (!(STI.hasFeature(X86::Mode64Bit) || STI.hasFeature(X86::Mode32Bit)))
+ return false;
+
+ return true;
+}
+
+/// Check if the instruction operand needs to be aligned.
+bool X86AsmBackend::needAlign(const MCInst &Inst) const {
+ const MCInstrDesc &Desc = MCII->get(Inst.getOpcode());
+ return (Desc.isConditionalBranch() &&
+ (AlignBranchType & X86::AlignBranchJcc)) ||
+ (Desc.isUnconditionalBranch() &&
+ (AlignBranchType & X86::AlignBranchJmp)) ||
+ (Desc.isCall() && (AlignBranchType & X86::AlignBranchCall)) ||
+ (Desc.isReturn() && (AlignBranchType & X86::AlignBranchRet)) ||
+ (Desc.isIndirectBranch() &&
+ (AlignBranchType & X86::AlignBranchIndirect));
+}
+
/// Insert BoundaryAlignFragment before instructions to align branches.
void X86AsmBackend::emitInstructionBegin(MCObjectStreamer &OS,
const MCInst &Inst) {
- AllowAutoPaddingForInst = allowAutoPaddingForInst(Inst, OS);
+ CanPadInst = canPadInst(Inst, OS);
- if (!needAlign(OS))
+ if (!canPadBranches(OS))
return;
if (!isMacroFused(PrevInst, Inst))
// Macro fusion doesn't happen indeed, clear the pending.
- PendingBoundaryAlign = nullptr;
+ PendingBA = nullptr;
- if (!AllowAutoPaddingForInst)
+ if (!CanPadInst)
return;
- if (PendingBoundaryAlign &&
- OS.getCurrentFragment()->getPrevNode() == PendingBoundaryAlign) {
+ if (PendingBA && OS.getCurrentFragment()->getPrevNode() == PendingBA) {
// Macro fusion actually happens and there is no other fragment inserted
// after the previous instruction.
//
return;
}
- if (needAlignInst(Inst) || ((AlignBranchType & X86::AlignBranchFused) &&
- isFirstMacroFusibleInst(Inst, *MCII))) {
+ if (needAlign(Inst) || ((AlignBranchType & X86::AlignBranchFused) &&
+ isFirstMacroFusibleInst(Inst, *MCII))) {
// If we meet a unfused branch or the first instuction in a fusiable pair,
// insert a BoundaryAlign fragment.
- OS.insert(PendingBoundaryAlign =
- new MCBoundaryAlignFragment(AlignBoundary));
+ OS.insert(PendingBA = new MCBoundaryAlignFragment(AlignBoundary));
}
}
MCFragment *CF = OS.getCurrentFragment();
PrevInstPosition = std::make_pair(CF, getSizeForInstFragment(CF));
if (auto *F = dyn_cast_or_null<MCRelaxableFragment>(CF))
- F->setAllowAutoPadding(AllowAutoPaddingForInst);
+ F->setAllowAutoPadding(CanPadInst);
- if (!needAlign(OS))
+ if (!canPadBranches(OS))
return;
- if (!needAlignInst(Inst) || !PendingBoundaryAlign)
+ if (!needAlign(Inst) || !PendingBA)
return;
// Tie the aligned instructions into a a pending BoundaryAlign.
- PendingBoundaryAlign->setLastFragment(CF);
- PendingBoundaryAlign = nullptr;
+ PendingBA->setLastFragment(CF);
+ PendingBA = nullptr;
// We need to ensure that further data isn't added to the current
// DataFragment, so that we can get the size of instructions later in
return getRelaxedOpcode(Inst, Is16BitMode) == Inst.getOpcode();
}
-static unsigned getRemainingPrefixSize(const MCInst &Inst,
- const MCSubtargetInfo &STI,
- MCCodeEmitter &Emitter) {
- SmallString<256> Code;
- raw_svector_ostream VecOS(Code);
- Emitter.emitPrefix(Inst, VecOS, STI);
- assert(Code.size() < 15 && "The number of prefixes must be less than 15.");
-
- // TODO: It turns out we need a decent amount of plumbing for the target
- // specific bits to determine number of prefixes its safe to add. Various
- // targets (older chips mostly, but also Atom family) encounter decoder
- // stalls with too many prefixes. For testing purposes, we set the value
- // externally for the moment.
- unsigned ExistingPrefixSize = Code.size();
- unsigned TargetPrefixMax = X86PadMaxPrefixSize;
- if (TargetPrefixMax <= ExistingPrefixSize)
- return 0;
- return TargetPrefixMax - ExistingPrefixSize;
-}
-
bool X86AsmBackend::padInstructionViaPrefix(MCRelaxableFragment &RF,
MCCodeEmitter &Emitter,
unsigned &RemainingSize) const {
return false;
const unsigned MaxPossiblePad = std::min(15 - OldSize, RemainingSize);
+ const unsigned RemainingPrefixSize = [&]() -> unsigned {
+ SmallString<15> Code;
+ raw_svector_ostream VecOS(Code);
+ Emitter.emitPrefix(RF.getInst(), VecOS, STI);
+ assert(Code.size() < 15 && "The number of prefixes must be less than 15.");
+
+ // TODO: It turns out we need a decent amount of plumbing for the target
+ // specific bits to determine number of prefixes its safe to add. Various
+ // targets (older chips mostly, but also Atom family) encounter decoder
+ // stalls with too many prefixes. For testing purposes, we set the value
+ // externally for the moment.
+ unsigned ExistingPrefixSize = Code.size();
+ if (TargetPrefixMax <= ExistingPrefixSize)
+ return 0;
+ return TargetPrefixMax - ExistingPrefixSize;
+ }();
const unsigned PrefixBytesToAdd =
- std::min(MaxPossiblePad,
- getRemainingPrefixSize(RF.getInst(), STI, Emitter));
+ std::min(MaxPossiblePad, RemainingPrefixSize);
if (PrefixBytesToAdd == 0)
return false;