90#define DEBUG_TYPE "shrink-wrap"
93STATISTIC(NumCandidates,
"Number of shrink-wrapping candidates");
95 "Number of shrink-wrapping candidates dropped because of frequency");
99 cl::desc(
"enable the shrink-wrapping pass"));
102 cl::desc(
"enable splitting of the restore block if possible"));
144 unsigned FrameSetupOpcode = ~0u;
147 unsigned FrameDestroyOpcode = ~0u;
158 mutable SetOfRegs CurrentCSRs;
174 bool StackAddressUsed)
const;
176 const SetOfRegs &getCurrentCSRs(
RegScavenger *RS)
const {
177 if (CurrentCSRs.empty()) {
184 for (
int Reg = SavedRegs.
find_first(); Reg != -1;
186 CurrentCSRs.insert((
unsigned)Reg);
200 bool performShrinkWrapping(
217 bool checkIfRestoreSplittable(
227 MDT = &getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
228 MPDT = &getAnalysis<MachinePostDominatorTreeWrapperPass>().getPostDomTree();
231 MBFI = &getAnalysis<MachineBlockFrequencyInfoWrapperPass>().getMBFI();
232 MLI = &getAnalysis<MachineLoopInfoWrapperPass>().getLI();
233 ORE = &getAnalysis<MachineOptimizationRemarkEmitterPass>().getORE();
237 FrameSetupOpcode =
TII.getCallFrameSetupOpcode();
238 FrameDestroyOpcode =
TII.getCallFrameDestroyOpcode();
/// Returns true only when Save and Restore are both non-null and Save is
/// different from Entry.
/// NOTE(review): presumably Save == Entry means the save point is still the
/// function entry, so nothing would be gained — confirm against the class.
249 bool ArePointsInteresting()
const {
return Save !=
Entry && Save && Restore; }
273 MachineFunctionProperties::Property::NoVRegs);
285char ShrinkWrap::ID = 0;
298 bool StackAddressUsed)
const {
306 if (
Op->getValue()) {
310 if (
auto *Arg = dyn_cast<Argument>(UO))
311 return !Arg->hasPassPointeeByValueCopyAttr();
312 return isa<GlobalValue>(UO);
315 return PSV->isJumpTable();
320 if (StackAddressUsed &&
MI.mayLoadOrStore() &&
321 (
MI.isCall() ||
MI.hasUnmodeledSideEffects() ||
MI.memoperands_empty() ||
322 !
all_of(
MI.memoperands(), IsKnownNonStackPtr)))
325 if (
MI.getOpcode() == FrameSetupOpcode ||
326 MI.getOpcode() == FrameDestroyOpcode) {
333 bool UseOrDefCSR =
false;
336 if (!MO.isDef() && !MO.readsReg())
352 (!
MI.isCall() && PhysReg == SP) ||
354 (!
MI.isReturn() &&
TRI->isNonallocatableRegisterCalleeSave(PhysReg));
355 }
else if (MO.isRegMask()) {
357 for (
unsigned Reg : getCurrentCSRs(RS)) {
358 if (MO.clobbersPhysReg(Reg)) {
365 if (UseOrDefCSR || (MO.isFI() && !
MI.isDebugValue())) {
366 LLVM_DEBUG(
dbgs() <<
"Use or define CSR(" << UseOrDefCSR <<
") or FI("
367 << MO.isFI() <<
"): " <<
MI <<
'\n');
375template <
typename ListOfBBs,
typename DominanceAnalysis>
377 DominanceAnalysis &Dom,
bool Strict =
true) {
379 if (Strict && IDom == &
Block)
400 if (ReachableByDirty.
count(PredBB))
410 while (!Worklist.
empty()) {
412 if (!Visited.
insert(SuccMBB).second)
437 while (!Worklist.
empty()) {
439 if (CleanBB == SavePoint)
465 TII->insertUnconditionalBranch(*BBToUpdate, NMBB,
DL);
490 if (BB->getFallThrough(
false) ==
MBB)
491 MBBFallthrough.
insert(BB);
506 SuccBB->ReplaceUsesOfBlockWith(
MBB, NMBB);
531 if (BB->getFallThrough(
false) == NMBB)
532 NMBBFallthrough.
insert(BB);
536 SuccBB->ReplaceUsesOfBlockWith(NMBB,
MBB);
548bool ShrinkWrap::checkIfRestoreSplittable(
555 if (useOrDefCSROrFI(
MI, RS,
true))
562 if (ReachableByDirty.
count(PredBB))
568 return !(CleanPreds.
empty() || DirtyPreds.
empty());
571bool ShrinkWrap::postShrinkWrapping(
bool HasCandidate,
MachineFunction &MF,
581 InitRestore = Restore;
583 InitRestore =
nullptr;
584 InitSave = &MF.
front();
597 if (!InitSave || !InitRestore || InitRestore == InitSave ||
598 !MDT->
dominates(InitSave, InitRestore) ||
615 if (useOrDefCSROrFI(
MI, RS,
true)) {
628 if (!checkIfRestoreSplittable(InitRestore, ReachableByDirty, DirtyPreds,
629 CleanPreds,
TII, RS))
634 FindIDom<>(**DirtyPreds.
begin(), DirtyPreds, *MDT,
false);
636 while (NewSave && (
hasDirtyPred(ReachableByDirty, *NewSave) ||
637 EntryFreq < MBFI->getBlockFreq(NewSave) ||
645 if (!NewSave || NewSave == InitSave ||
663 Restore = NewRestore;
669 "Incorrect save or restore point due to dominance relations");
671 "Unexpected save or restore point in a loop");
674 "Incorrect save or restore point based on block frequency");
700 if (Restore == &
MBB) {
702 if (!useOrDefCSROrFI(Terminator, RS,
true))
711 Restore = FindIDom<>(*Restore, Restore->
successors(), *MPDT);
718 dbgs() <<
"Restore point needs to be spanned on several blocks\n");
729 bool SaveDominatesRestore =
false;
730 bool RestorePostDominatesSave =
false;
732 (!(SaveDominatesRestore = MDT->
dominates(Save, Restore)) ||
733 !(RestorePostDominatesSave = MPDT->
dominates(Restore, Save)) ||
753 if (!SaveDominatesRestore) {
758 if (!RestorePostDominatesSave)
778 IPdom = FindIDom<>(*IPdom, LoopExitBB->successors(), *MPDT);
809bool ShrinkWrap::performShrinkWrapping(
817 "EH Funclets are not supported yet.",
826 updateSaveRestorePoints(*
MBB, RS);
827 if (!ArePointsInteresting()) {
828 LLVM_DEBUG(
dbgs() <<
"EHPad/inlineasm_br prevents shrink-wrapping\n");
834 bool StackAddressUsed =
false;
841 if (StackAddressUsedBlockInfo.
test(Pred->getNumber())) {
842 StackAddressUsed =
true;
848 if (useOrDefCSROrFI(
MI, RS, StackAddressUsed)) {
851 updateSaveRestorePoints(*
MBB, RS);
854 if (!ArePointsInteresting()) {
860 StackAddressUsed =
true;
864 StackAddressUsedBlockInfo[
MBB->
getNumber()] = StackAddressUsed;
866 if (!ArePointsInteresting()) {
870 assert(!Save && !Restore &&
"We miss a shrink-wrap opportunity?!");
881 LLVM_DEBUG(
dbgs() <<
"Shrink wrap candidates (#, Name, Freq):\nSave: "
887 bool IsSaveCheap, TargetCanUseSaveAsPrologue =
false;
888 if (((IsSaveCheap = EntryFreq >= MBFI->
getBlockFreq(Save)) &&
894 dbgs() <<
"New points are too expensive or invalid for the target\n");
896 if (!IsSaveCheap || !TargetCanUseSaveAsPrologue) {
903 Restore = FindIDom<>(*Restore, Restore->
successors(), *MPDT);
908 updateSaveRestorePoints(*NewBB, RS);
909 }
while (Save && Restore);
911 if (!ArePointsInteresting()) {
912 ++NumCandidatesDropped;
919 if (skipFunction(MF.
getFunction()) || MF.
empty() || !isShrinkWrapEnabled(MF))
927 if (containsIrreducibleCFG<MachineBasicBlock *>(RPOT, *MLI)) {
935 "Irreducible CFGs are not supported yet.",
940 std::unique_ptr<RegScavenger> RS(
943 bool Changed =
false;
949 bool HasCandidate = performShrinkWrapping(RPOT, RS.get());
950 StackAddressUsedBlockInfo.
clear();
951 Changed = postShrinkWrapping(HasCandidate, MF, RS.get());
952 if (!HasCandidate && !Changed)
954 if (!ArePointsInteresting())
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This file contains the simple types necessary to represent the attributes associated with functions a...
This file implements the BitVector class.
const HexagonInstrInfo * TII
unsigned const TargetRegisterInfo * TRI
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file implements a set that has insertion order iteration characteristics.
static void markAllReachable(DenseSet< const MachineBasicBlock * > &Visited, const MachineBasicBlock &MBB)
Derives the list of all the basic blocks reachable from MBB.
static void updateTerminator(MachineBasicBlock *BBToUpdate, MachineBasicBlock *NMBB, const TargetInstrInfo *TII)
This function updates the branches post restore point split.
static MachineBasicBlock * tryToSplitRestore(MachineBasicBlock *MBB, ArrayRef< MachineBasicBlock * > DirtyPreds, const TargetInstrInfo *TII)
This function splits the restore point and returns new restore point/BB.
static bool hasDirtyPred(const DenseSet< const MachineBasicBlock * > &ReachableByDirty, const MachineBasicBlock &MBB)
Determines if any predecessor of MBB is on the path from a block that has a use or def of CSRs/FI to MBB.
static bool giveUpWithRemarks(MachineOptimizationRemarkEmitter *ORE, StringRef RemarkName, StringRef RemarkMessage, const DiagnosticLocation &Loc, const MachineBasicBlock *MBB)
static cl::opt< bool > EnablePostShrinkWrapOpt("enable-shrink-wrap-region-split", cl::init(true), cl::Hidden, cl::desc("enable splitting of the restore block if possible"))
static void rollbackRestoreSplit(MachineFunction &MF, MachineBasicBlock *NMBB, MachineBasicBlock *MBB, ArrayRef< MachineBasicBlock * > DirtyPreds, const TargetInstrInfo *TII)
This function undoes the restore point split done earlier.
static bool isAnalyzableBB(const TargetInstrInfo &TII, MachineBasicBlock &Entry)
static bool isSaveReachableThroughClean(const MachineBasicBlock *SavePoint, ArrayRef< MachineBasicBlock * > CleanPreds)
static cl::opt< cl::boolOrDefault > EnableShrinkWrapOpt("enable-shrink-wrap", cl::Hidden, cl::desc("enable the shrink-wrapping pass"))
static void collectBlocksReachableByDirty(const DenseSet< const MachineBasicBlock * > &DirtyBBs, DenseSet< const MachineBasicBlock * > &ReachableByDirty)
Collect blocks reachable by use or def of CSRs/FI.
static MachineBasicBlock * FindIDom(MachineBasicBlock &Block, ListOfBBs BBs, DominanceAnalysis &Dom, bool Strict=true)
Helper function to find the immediate (post) dominator.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
This file describes how to lower LLVM code to machine code.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
void setPreservesAll()
Set by analyses that do not transform their input at all.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
bool test(unsigned Idx) const
int find_first() const
find_first - Returns the index of the first set bit, -1 if none of the bits are set.
void resize(unsigned N, bool t=false)
resize - Grow or shrink the bitvector.
void clear()
clear - Removes all bits from the bitvector.
int find_next(unsigned Prev) const
find_next - Returns the index of the next set bit following the "Prev" bit.
uint64_t getFrequency() const
Returns the frequency as a fixpoint number scaled by the entry frequency.
This class represents an Operation in the Expression.
Implements a dense probed hash-table based set.
NodeT * findNearestCommonDominator(NodeT *A, NodeT *B) const
Find nearest common dominator basic block for basic block A and B.
bool dominates(const DomTreeNodeBase< NodeT > *A, const DomTreeNodeBase< NodeT > *B) const
dominates - Returns true iff A dominates B.
void recalculate(ParentType &Func)
recalculate - compute a dominator tree for the given function
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
DISubprogram * getSubprogram() const
Get the attached subprogram.
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
Analyze the branching code at the end of MBB, returning true if it cannot be understood (e....
void getExitingBlocks(SmallVectorImpl< BlockT * > &ExitingBlocks) const
Return all blocks inside the loop that have successors outside of the loop.
unsigned getLoopDepth(const BlockT *BB) const
Return the loop nesting level of the specified block.
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
bool usesWindowsCFI() const
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
bool isEHPad() const
Returns true if the block is a landing pad.
iterator_range< livein_iterator > liveins() const
int getNumber() const
MachineBasicBlocks are uniquely numbered at the function level, unless they're not in a MachineFuncti...
succ_iterator succ_begin()
bool isEHFuncletEntry() const
Returns true if this is the entry block of an EH funclet.
bool isReturnBlock() const
Convenience function that returns true if the block ends in a return instruction.
void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
void removeSuccessor(MachineBasicBlock *Succ, bool NormalizeSuccProbs=false)
Remove successor from the successors list of this MachineBasicBlock.
pred_iterator pred_begin()
bool isLayoutSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB will be emitted immediately after this block, such that if this bloc...
void eraseFromParent()
This method unlinks 'this' from the containing function and deletes it.
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
iterator_range< iterator > terminators()
DebugLoc findBranchDebugLoc()
Find and return the merged DebugLoc of the branch instructions of the block.
iterator_range< succ_iterator > successors()
iterator_range< pred_iterator > predecessors()
MachineBlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate machine basic b...
BlockFrequency getBlockFreq(const MachineBasicBlock *MBB) const
getBlockFreq - Return block frequency.
BlockFrequency getEntryFreq() const
Divide a block's BlockFrequency::getFrequency() value by this value to obtain the entry block - relat...
Analysis pass which computes a MachineDominatorTree.
DominatorTree Class - Concrete subclass of DominatorTreeBase that is used to compute a normal dominat...
bool dominates(const MachineInstr *A, const MachineInstr *B) const
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
void setRestorePoint(MachineBasicBlock *NewRestore)
void setSavePoint(MachineBasicBlock *NewSave)
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
virtual MachineFunctionProperties getRequiredProperties() const
Properties which a MachineFunction may have at a given point in time.
MachineFunctionProperties & set(Property P)
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
unsigned getNumBlockIDs() const
getNumBlockIDs - Return the number of MBB ID's allocated.
const MachineBasicBlock & front() const
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineBasicBlock - Allocate a new MachineBasicBlock.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with.
Representation of each machine instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
A description of a memory reference used in the backend.
MachineOperand class - Representation of each machine instruction operand.
MachinePostDominatorTree - an analysis pass wrapper for DominatorTree used to compute the post-domina...
MachineBasicBlock * findNearestCommonDominator(ArrayRef< MachineBasicBlock * > Blocks) const
Returns the nearest common dominator of the given blocks.
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Pass interface - Implemented by all 'passes'.
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
Special value supplied for machine level alias analysis.
MCRegister getLastCalleeSavedAlias(MCRegister PhysReg) const
getLastCalleeSavedAlias - Returns the last callee saved register that overlaps PhysReg,...
void runOnMachineFunction(const MachineFunction &MF)
runOnFunction - Prepare to answer questions about MF.
Wrapper class representing virtual and physical registers.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
A SetVector that performs no allocations if smaller than a certain size.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Information about stack frame layout on the target.
virtual void determineCalleeSaves(MachineFunction &MF, BitVector &SavedRegs, RegScavenger *RS=nullptr) const
This method determines which of the registers reported by TargetRegisterInfo::getCalleeSavedRegs() sh...
virtual bool enableShrinkWrapping(const MachineFunction &MF) const
Returns true if the target will correctly handle shrink wrapping.
virtual bool canUseAsEpilogue(const MachineBasicBlock &MBB) const
Check whether or not the given MBB can be used as an epilogue for the target.
virtual bool canUseAsPrologue(const MachineBasicBlock &MBB) const
Check whether or not the given MBB can be used as a prologue for the target.
TargetInstrInfo - Interface to description of machine instruction set.
Register getStackPointerRegisterToSaveRestore() const
If a physical register, this specifies the register that llvm.stacksave/llvm.stackrestore should save...
const MCAsmInfo * getMCAsmInfo() const
Return target specific asm information.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetRegisterInfo * getRegisterInfo() const
getRegisterInfo - If register information is available, return it.
virtual const TargetFrameLowering * getFrameLowering() const
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetLowering * getTargetLowering() const
LLVM Value Representation.
std::pair< iterator, bool > insert(const ValueT &V)
size_type count(const_arg_type_t< ValueT > V) const
Return 1 if the specified key is in the set, 0 otherwise.
A range adaptor for a pair of iterators.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=6)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
char & ShrinkWrapID
ShrinkWrap pass. Look for the best place to insert save and restore.
void initializeShrinkWrapPass(PassRegistry &)
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
DWARFExpression::Operation Op
Printable printBlockFreq(const BlockFrequencyInfo &BFI, BlockFrequency Freq)
Print the block frequency Freq relative to the current functions entry frequency.
Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
Pair of physical register and lane mask.