91#define DEBUG_TYPE "shrink-wrap"
94STATISTIC(NumCandidates,
"Number of shrink-wrapping candidates");
96 "Number of shrink-wrapping candidates dropped because of frequency");
100 cl::desc(
"enable the shrink-wrapping pass"));
103 cl::desc(
"enable splitting of the restore block if possible"));
114class ShrinkWrapImpl {
145 unsigned FrameSetupOpcode = ~0u;
148 unsigned FrameDestroyOpcode = ~0u;
159 mutable SetOfRegs CurrentCSRs;
175 bool StackAddressUsed)
const;
177 const SetOfRegs &getCurrentCSRs(
RegScavenger *RS)
const {
178 if (CurrentCSRs.empty()) {
185 for (
int Reg = SavedRegs.
find_first(); Reg != -1;
187 CurrentCSRs.insert((
unsigned)Reg);
201 bool performShrinkWrapping(
218 bool checkIfRestoreSplittable(
233 FrameSetupOpcode =
TII.getCallFrameSetupOpcode();
234 FrameDestroyOpcode =
TII.getCallFrameDestroyOpcode();
/// Report whether the current Save/Restore pair is worth keeping: true only
/// when Save differs from Entry and both Save and Restore are non-null.
245 bool ArePointsInteresting()
const {
return Save !=
Entry && Save && Restore; }
251 : MDT(MDT), MPDT(MPDT), MBFI(MBFI), MLI(MLI), ORE(ORE) {}
290char ShrinkWrapLegacy::ID = 0;
305 bool StackAddressUsed)
const {
313 if (
Op->getValue()) {
317 if (
auto *Arg = dyn_cast<Argument>(UO))
318 return !Arg->hasPassPointeeByValueCopyAttr();
319 return isa<GlobalValue>(UO);
322 return PSV->isJumpTable();
327 if (StackAddressUsed &&
MI.mayLoadOrStore() &&
328 (
MI.isCall() ||
MI.hasUnmodeledSideEffects() ||
MI.memoperands_empty() ||
329 !
all_of(
MI.memoperands(), IsKnownNonStackPtr)))
332 if (
MI.getOpcode() == FrameSetupOpcode ||
333 MI.getOpcode() == FrameDestroyOpcode) {
340 bool UseOrDefCSR =
false;
343 if (!MO.isDef() && !MO.readsReg())
361 UseOrDefCSR = (!
MI.isCall() && PhysReg == SP) ||
364 TRI->isNonallocatableRegisterCalleeSave(PhysReg)) ||
365 TRI->isVirtualFrameRegister(PhysReg);
366 }
else if (MO.isRegMask()) {
368 for (
unsigned Reg : getCurrentCSRs(RS)) {
369 if (MO.clobbersPhysReg(Reg)) {
376 if (UseOrDefCSR || (MO.isFI() && !
MI.isDebugValue())) {
377 LLVM_DEBUG(
dbgs() <<
"Use or define CSR(" << UseOrDefCSR <<
") or FI("
378 << MO.isFI() <<
"): " <<
MI <<
'\n');
386template <
typename ListOfBBs,
typename DominanceAnalysis>
388 DominanceAnalysis &Dom,
bool Strict =
true) {
390 if (Strict && IDom == &
Block)
411 if (ReachableByDirty.
count(PredBB))
421 while (!Worklist.
empty()) {
423 if (!Visited.
insert(SuccMBB).second)
448 while (!Worklist.
empty()) {
450 if (CleanBB == SavePoint)
476 TII->insertUnconditionalBranch(*BBToUpdate, NMBB,
DL);
501 if (BB->getFallThrough(
false) ==
MBB)
502 MBBFallthrough.
insert(BB);
517 SuccBB->ReplaceUsesOfBlockWith(
MBB, NMBB);
542 if (BB->getFallThrough(
false) == NMBB)
543 NMBBFallthrough.
insert(BB);
547 SuccBB->ReplaceUsesOfBlockWith(NMBB,
MBB);
559bool ShrinkWrapImpl::checkIfRestoreSplittable(
566 if (useOrDefCSROrFI(
MI, RS,
true))
573 if (ReachableByDirty.
count(PredBB))
579 return !(CleanPreds.
empty() || DirtyPreds.
empty());
582bool ShrinkWrapImpl::postShrinkWrapping(
bool HasCandidate,
MachineFunction &MF,
592 InitRestore = Restore;
594 InitRestore =
nullptr;
595 InitSave = &MF.
front();
608 if (!InitSave || !InitRestore || InitRestore == InitSave ||
609 !MDT->
dominates(InitSave, InitRestore) ||
626 if (useOrDefCSROrFI(
MI, RS,
true)) {
639 if (!checkIfRestoreSplittable(InitRestore, ReachableByDirty, DirtyPreds,
640 CleanPreds,
TII, RS))
645 FindIDom<>(**DirtyPreds.
begin(), DirtyPreds, *MDT,
false);
647 while (NewSave && (
hasDirtyPred(ReachableByDirty, *NewSave) ||
648 EntryFreq < MBFI->getBlockFreq(NewSave) ||
656 if (!NewSave || NewSave == InitSave ||
674 Restore = NewRestore;
680 "Incorrect save or restore point due to dominance relations");
682 "Unexpected save or restore point in a loop");
685 "Incorrect save or restore point based on block frequency");
711 if (Restore == &
MBB) {
713 if (!useOrDefCSROrFI(Terminator, RS,
true))
722 Restore = FindIDom<>(*Restore, Restore->
successors(), *MPDT);
729 dbgs() <<
"Restore point needs to be spanned on several blocks\n");
740 bool SaveDominatesRestore =
false;
741 bool RestorePostDominatesSave =
false;
743 (!(SaveDominatesRestore = MDT->
dominates(Save, Restore)) ||
744 !(RestorePostDominatesSave = MPDT->
dominates(Restore, Save)) ||
764 if (!SaveDominatesRestore) {
769 if (!RestorePostDominatesSave)
789 IPdom = FindIDom<>(*IPdom, LoopExitBB->successors(), *MPDT);
820bool ShrinkWrapImpl::performShrinkWrapping(
828 "EH Funclets are not supported yet.",
837 updateSaveRestorePoints(*
MBB, RS);
838 if (!ArePointsInteresting()) {
839 LLVM_DEBUG(
dbgs() <<
"EHPad/inlineasm_br prevents shrink-wrapping\n");
845 bool StackAddressUsed =
false;
852 if (StackAddressUsedBlockInfo.
test(Pred->getNumber())) {
853 StackAddressUsed =
true;
859 if (useOrDefCSROrFI(
MI, RS, StackAddressUsed)) {
862 updateSaveRestorePoints(*
MBB, RS);
865 if (!ArePointsInteresting()) {
871 StackAddressUsed =
true;
875 StackAddressUsedBlockInfo[
MBB->
getNumber()] = StackAddressUsed;
877 if (!ArePointsInteresting()) {
881 assert(!Save && !Restore &&
"We miss a shrink-wrap opportunity?!");
892 LLVM_DEBUG(
dbgs() <<
"Shrink wrap candidates (#, Name, Freq):\nSave: "
898 bool IsSaveCheap, TargetCanUseSaveAsPrologue =
false;
899 if (((IsSaveCheap = EntryFreq >= MBFI->
getBlockFreq(Save)) &&
905 dbgs() <<
"New points are too expensive or invalid for the target\n");
907 if (!IsSaveCheap || !TargetCanUseSaveAsPrologue) {
914 Restore = FindIDom<>(*Restore, Restore->
successors(), *MPDT);
919 updateSaveRestorePoints(*NewBB, RS);
920 }
while (Save && Restore);
922 if (!ArePointsInteresting()) {
923 ++NumCandidatesDropped;
935 if (containsIrreducibleCFG<MachineBasicBlock *>(RPOT, *MLI)) {
943 "Irreducible CFGs are not supported yet.",
948 std::unique_ptr<RegScavenger> RS(
951 bool Changed =
false;
957 bool HasCandidate = performShrinkWrapping(RPOT, RS.get());
958 StackAddressUsedBlockInfo.
clear();
959 Changed = postShrinkWrapping(HasCandidate, MF, RS.get());
960 if (!HasCandidate && !Changed)
962 if (!ArePointsInteresting())
984 !ShrinkWrapImpl::isShrinkWrapEnabled(MF))
988 &getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
990 &getAnalysis<MachinePostDominatorTreeWrapperPass>().getPostDomTree();
992 &getAnalysis<MachineBlockFrequencyInfoWrapperPass>().getMBFI();
993 MachineLoopInfo *MLI = &getAnalysis<MachineLoopInfoWrapperPass>().getLI();
995 &getAnalysis<MachineOptimizationRemarkEmitterPass>().getORE();
997 return ShrinkWrapImpl(MDT, MPDT, MBFI, MLI, ORE).run(MF);
1003 if (MF.
empty() || !ShrinkWrapImpl::isShrinkWrapEnabled(MF))
1015 ShrinkWrapImpl(&MDT, &MPDT, &MBFI, &MLI, &ORE).
run(MF);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This file contains the simple types necessary to represent the attributes associated with functions a...
This file implements the BitVector class.
const HexagonInstrInfo * TII
Register const TargetRegisterInfo * TRI
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
This file implements a set that has insertion order iteration characteristics.
static void markAllReachable(DenseSet< const MachineBasicBlock * > &Visited, const MachineBasicBlock &MBB)
Derives the list of all the basic blocks reachable from MBB.
static void updateTerminator(MachineBasicBlock *BBToUpdate, MachineBasicBlock *NMBB, const TargetInstrInfo *TII)
This function updates the branches post restore point split.
static MachineBasicBlock * tryToSplitRestore(MachineBasicBlock *MBB, ArrayRef< MachineBasicBlock * > DirtyPreds, const TargetInstrInfo *TII)
This function splits the restore point and returns new restore point/BB.
static bool hasDirtyPred(const DenseSet< const MachineBasicBlock * > &ReachableByDirty, const MachineBasicBlock &MBB)
Determines if any predecessor of MBB is on a path from a block that has a use or def of CSRs/FI to MBB.
static bool giveUpWithRemarks(MachineOptimizationRemarkEmitter *ORE, StringRef RemarkName, StringRef RemarkMessage, const DiagnosticLocation &Loc, const MachineBasicBlock *MBB)
static cl::opt< bool > EnablePostShrinkWrapOpt("enable-shrink-wrap-region-split", cl::init(true), cl::Hidden, cl::desc("enable splitting of the restore block if possible"))
static void rollbackRestoreSplit(MachineFunction &MF, MachineBasicBlock *NMBB, MachineBasicBlock *MBB, ArrayRef< MachineBasicBlock * > DirtyPreds, const TargetInstrInfo *TII)
This function undoes the restore point split done earlier.
static bool isAnalyzableBB(const TargetInstrInfo &TII, MachineBasicBlock &Entry)
static bool isSaveReachableThroughClean(const MachineBasicBlock *SavePoint, ArrayRef< MachineBasicBlock * > CleanPreds)
static cl::opt< cl::boolOrDefault > EnableShrinkWrapOpt("enable-shrink-wrap", cl::Hidden, cl::desc("enable the shrink-wrapping pass"))
static void collectBlocksReachableByDirty(const DenseSet< const MachineBasicBlock * > &DirtyBBs, DenseSet< const MachineBasicBlock * > &ReachableByDirty)
Collect blocks reachable by use or def of CSRs/FI.
static MachineBasicBlock * FindIDom(MachineBasicBlock &Block, ListOfBBs BBs, DominanceAnalysis &Dom, bool Strict=true)
Helper function to find the immediate (post) dominator.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
This file describes how to lower LLVM code to machine code.
A container for analyses that lazily runs them and caches their results.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
void setPreservesAll()
Set by analyses that do not transform their input at all.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
bool test(unsigned Idx) const
int find_first() const
find_first - Returns the index of the first set bit, -1 if none of the bits are set.
void resize(unsigned N, bool t=false)
resize - Grow or shrink the bitvector.
void clear()
clear - Removes all bits from the bitvector.
int find_next(unsigned Prev) const
find_next - Returns the index of the next set bit following the "Prev" bit.
uint64_t getFrequency() const
Returns the frequency as a fixpoint number scaled by the entry frequency.
This class represents an Operation in the Expression.
Implements a dense probed hash-table based set.
NodeT * findNearestCommonDominator(NodeT *A, NodeT *B) const
Find nearest common dominator basic block for basic block A and B.
bool dominates(const DomTreeNodeBase< NodeT > *A, const DomTreeNodeBase< NodeT > *B) const
dominates - Returns true iff A dominates B.
void recalculate(ParentType &Func)
recalculate - compute a dominator tree for the given function
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
DISubprogram * getSubprogram() const
Get the attached subprogram.
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
Analyze the branching code at the end of MBB, returning true if it cannot be understood (e....
void getExitingBlocks(SmallVectorImpl< BlockT * > &ExitingBlocks) const
Return all blocks inside the loop that have successors outside of the loop.
unsigned getLoopDepth(const BlockT *BB) const
Return the loop nesting level of the specified block.
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
bool usesWindowsCFI() const
An RAII based helper class to modify MachineFunctionProperties when running pass.
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
bool isEHPad() const
Returns true if the block is a landing pad.
iterator_range< livein_iterator > liveins() const
int getNumber() const
MachineBasicBlocks are uniquely numbered at the function level, unless they're not in a MachineFuncti...
succ_iterator succ_begin()
bool isEHFuncletEntry() const
Returns true if this is the entry block of an EH funclet.
bool isReturnBlock() const
Convenience function that returns true if the block ends in a return instruction.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
LLVM_ABI void removeSuccessor(MachineBasicBlock *Succ, bool NormalizeSuccProbs=false)
Remove successor from the successors list of this MachineBasicBlock.
pred_iterator pred_begin()
LLVM_ABI bool isLayoutSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB will be emitted immediately after this block, such that if this bloc...
LLVM_ABI void eraseFromParent()
This method unlinks 'this' from the containing function and deletes it.
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
iterator_range< iterator > terminators()
LLVM_ABI DebugLoc findBranchDebugLoc()
Find and return the merged DebugLoc of the branch instructions of the block.
iterator_range< succ_iterator > successors()
iterator_range< pred_iterator > predecessors()
MachineBlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate machine basic b...
LLVM_ABI BlockFrequency getBlockFreq(const MachineBasicBlock *MBB) const
getBlockFreq - Return block frequency.
LLVM_ABI BlockFrequency getEntryFreq() const
Divide a block's BlockFrequency::getFrequency() value by this value to obtain the entry block - relat...
Analysis pass which computes a MachineDominatorTree.
Analysis pass which computes a MachineDominatorTree.
DominatorTree Class - Concrete subclass of DominatorTreeBase that is used to compute a normal dominat...
bool dominates(const MachineInstr *A, const MachineInstr *B) const
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
void setRestorePoints(ArrayRef< MachineBasicBlock * > NewRestorePoints)
void setSavePoints(ArrayRef< MachineBasicBlock * > NewSavePoints)
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
virtual MachineFunctionProperties getRequiredProperties() const
Properties which a MachineFunction may have at a given point in time.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
unsigned getNumBlockIDs() const
getNumBlockIDs - Return the number of MBB IDs allocated.
const MachineBasicBlock & front() const
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineBasicBlock - Allocate a new MachineBasicBlock.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Representation of each machine instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
Analysis pass that exposes the MachineLoopInfo for a machine function.
A description of a memory reference used in the backend.
MachineOperand class - Representation of each machine instruction operand.
MachinePostDominatorTree - an analysis pass wrapper for DominatorTree used to compute the post-domina...
LLVM_ABI MachineBasicBlock * findNearestCommonDominator(ArrayRef< MachineBasicBlock * > Blocks) const
Returns the nearest common dominator of the given blocks.
static LLVM_ABI PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Pass interface - Implemented by all 'passes'.
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Special value supplied for machine level alias analysis.
LLVM_ABI void runOnMachineFunction(const MachineFunction &MF, bool Rev=false)
runOnMachineFunction - Prepare to answer questions about MF.
MCRegister getLastCalleeSavedAlias(MCRegister PhysReg) const
getLastCalleeSavedAlias - Returns the last callee saved register that overlaps PhysReg,...
Wrapper class representing virtual and physical registers.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
A SetVector that performs no allocations if smaller than a certain size.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Information about stack frame layout on the target.
virtual void determineCalleeSaves(MachineFunction &MF, BitVector &SavedRegs, RegScavenger *RS=nullptr) const
This method determines which of the registers reported by TargetRegisterInfo::getCalleeSavedRegs() sh...
virtual bool enableShrinkWrapping(const MachineFunction &MF) const
Returns true if the target will correctly handle shrink wrapping.
virtual bool canUseAsEpilogue(const MachineBasicBlock &MBB) const
Check whether or not the given MBB can be used as an epilogue for the target.
virtual bool canUseAsPrologue(const MachineBasicBlock &MBB) const
Check whether or not the given MBB can be used as a prologue for the target.
TargetInstrInfo - Interface to description of machine instruction set.
Register getStackPointerRegisterToSaveRestore() const
If a physical register, this specifies the register that llvm.stacksave/llvm.stackrestore should save...
const MCAsmInfo * getMCAsmInfo() const
Return target specific asm information.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetFrameLowering * getFrameLowering() const
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
virtual const TargetLowering * getTargetLowering() const
LLVM Value Representation.
std::pair< iterator, bool > insert(const ValueT &V)
size_type count(const_arg_type_t< ValueT > V) const
Return 1 if the specified key is in the set, 0 otherwise.
A range adaptor for a pair of iterators.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
initializer< Ty > init(const Ty &Val)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
This is an optimization pass for GlobalISel generic memory operations.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void initializeShrinkWrapLegacyPass(PassRegistry &)
LLVM_ABI char & ShrinkWrapID
ShrinkWrap pass. Look for the best place to insert save and restore.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
DWARFExpression::Operation Op
LLVM_ABI Printable printBlockFreq(const BlockFrequencyInfo &BFI, BlockFrequency Freq)
Print the block frequency Freq relative to the current functions entry frequency.
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
Pair of physical register and lane mask.