45#include "llvm/Config/llvm-config.h"
67#define DEBUG_TYPE "branch-folder"
69STATISTIC(NumDeadBlocks,
"Number of dead blocks removed");
70STATISTIC(NumBranchOpts,
"Number of branches optimized");
71STATISTIC(NumTailMerge ,
"Number of block tails merged");
72STATISTIC(NumHoist ,
"Number of times common instructions are hoisted");
73STATISTIC(NumTailCalls,
"Number of tail calls optimized");
81 cl::desc(
"Max number of predecessors to consider tail merging"),
87 cl::desc(
"Min number of instructions to consider tail merging"),
116char BranchFolderLegacy::ID = 0;
126 bool EnableTailMerge =
127 !MF.getTarget().requiresStructuredCFG() && this->EnableTailMerge;
131 .getCachedResult<ProfileSummaryAnalysis>(
132 *MF.getFunction().getParent());
135 "ProfileSummaryAnalysis is required for BranchFoldingPass",
false);
139 BranchFolder Folder(EnableTailMerge,
true, MBBFreqInfo, MBPI,
142 MF.getSubtarget().getRegisterInfo()))
157 getAnalysis<MachineBlockFrequencyInfoWrapperPass>().getMBFI());
159 EnableTailMerge,
true, MBBFreqInfo,
160 getAnalysis<MachineBranchProbabilityInfoWrapperPass>().getMBPI(),
161 &getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI());
170 : EnableHoistCommonCode(CommonHoist), MinCommonTailLength(MinTailLength),
171 MBBFreqInfo(FreqInfo), MBPI(ProbInfo), PSI(PSI) {
174 EnableTailMerge = DefaultEnableTailMerge;
191 TriedMerging.erase(
MBB);
195 if (
MI.shouldUpdateAdditionalCallInfo())
200 EHScopeMembership.erase(
MBB);
209 if (!tii)
return false;
211 TriedMerging.clear();
214 AfterBlockPlacement = AfterPlacement;
220 if (MinCommonTailLength == 0) {
228 MRI.invalidateLiveness();
230 bool MadeChange =
false;
235 bool MadeChangeThisIteration =
true;
236 while (MadeChangeThisIteration) {
237 MadeChangeThisIteration = TailMergeBlocks(MF);
240 if (!AfterBlockPlacement || MadeChangeThisIteration)
241 MadeChangeThisIteration |= OptimizeBranches(MF);
242 if (EnableHoistCommonCode)
243 MadeChangeThisIteration |= HoistCommonCode(MF);
244 MadeChange |= MadeChangeThisIteration;
258 if (!
Op.isJTI())
continue;
261 JTIsLive.
set(
Op.getIndex());
267 for (
unsigned i = 0, e = JTIsLive.
size(); i != e; ++i)
268 if (!JTIsLive.
test(i)) {
282 unsigned Hash =
MI.getOpcode();
283 for (
unsigned i = 0, e =
MI.getNumOperands(); i != e; ++i) {
289 unsigned OperandHash = 0;
290 switch (
Op.getType()) {
292 OperandHash =
Op.getReg().id();
295 OperandHash =
Op.getImm();
298 OperandHash =
Op.getMBB()->getNumber();
303 OperandHash =
Op.getIndex();
309 OperandHash =
Op.getOffset();
315 Hash += ((OperandHash << 3) |
Op.getType()) << (i & 31);
331 return !(
MI.isDebugInstr() ||
MI.isCFIInstruction());
361 unsigned TailLen = 0;
365 if (MBBI1 == MBB1->
end() || MBBI2 == MBB2->
end())
367 if (!MBBI1->isIdenticalTo(*MBBI2) ||
373 MBBI1->isInlineAsm()) {
393 LiveRegs.addLiveOuts(OldMBB);
398 LiveRegs.stepBackward(*
I);
399 }
while (
I != OldInst);
408 "Can only handle full register.");
410 if (!LiveRegs.available(*MRI, Reg))
413 BuildMI(OldMBB, OldInst,
DL, TII->
get(TargetOpcode::IMPLICIT_DEF), Reg);
441 NewMBB->
splice(NewMBB->
end(), &CurMBB, BBI1, CurMBB.
end());
446 ML->addBasicBlockToLoop(NewMBB, *MLI);
455 const auto &EHScopeI = EHScopeMembership.find(&CurMBB);
456 if (EHScopeI != EHScopeMembership.end()) {
457 auto n = EHScopeI->second;
458 EHScopeMembership[NewMBB] = n;
469 for (;
I != E; ++
I) {
474 else if (
I->mayLoadOrStore())
497 if (
TBB == NextBB && !
Cond.empty() && !FBB) {
510BranchFolder::MergePotentialsElt::operator<(
const MergePotentialsElt &o)
const {
511 if (getHash() <
o.getHash())
513 if (getHash() >
o.getHash())
515 if (getBlock()->getNumber() <
o.getBlock()->getNumber())
517 if (getBlock()->getNumber() >
o.getBlock()->getNumber())
528 unsigned NumTerms = 0;
535 if (!
I->isTerminator())
break;
570 unsigned MinCommonTailLength,
unsigned &CommonTailLen,
579 if (!EHScopeMembership.
empty()) {
580 auto EHScope1 = EHScopeMembership.
find(MBB1);
581 assert(EHScope1 != EHScopeMembership.
end());
582 auto EHScope2 = EHScopeMembership.
find(MBB2);
583 assert(EHScope2 != EHScopeMembership.
end());
584 if (EHScope1->second != EHScope2->second)
589 if (CommonTailLen == 0)
593 << CommonTailLen <<
'\n');
603 bool FullBlockTail1 = I1 == MBB1->
begin();
604 bool FullBlockTail2 = I2 == MBB2->
begin();
611 if ((MBB1 == PredBB || MBB2 == PredBB) &&
612 (!AfterPlacement || MBB1->
succ_size() == 1)) {
615 if (CommonTailLen > NumTerms)
624 if (FullBlockTail1 && FullBlockTail2 &&
641 if (AfterPlacement && FullBlockTail1 && FullBlockTail2) {
647 return (
MBB != &*MF->
begin()) && std::prev(
I)->canFallThrough();
649 if (!BothFallThrough(MBB1) || !BothFallThrough(MBB2))
658 unsigned EffectiveTailLen = CommonTailLen;
659 if (SuccBB && MBB1 != PredBB && MBB2 != PredBB &&
660 (MBB1->
succ_size() == 1 || !AfterPlacement) &&
666 if (EffectiveTailLen >= MinCommonTailLength)
675 return EffectiveTailLen >= 2 && OptForSize &&
676 (FullBlockTail1 || FullBlockTail2);
679unsigned BranchFolder::ComputeSameTails(
unsigned CurHash,
680 unsigned MinCommonTailLength,
683 unsigned maxCommonTailLength = 0
U;
686 MPIterator HighestMPIter = std::prev(MergePotentials.end());
687 for (MPIterator CurMPIter = std::prev(MergePotentials.end()),
688 B = MergePotentials.begin();
689 CurMPIter !=
B && CurMPIter->getHash() == CurHash; --CurMPIter) {
690 for (MPIterator
I = std::prev(CurMPIter);
I->getHash() == CurHash; --
I) {
691 unsigned CommonTailLen;
694 CommonTailLen, TrialBBI1, TrialBBI2,
697 AfterBlockPlacement, MBBFreqInfo, PSI)) {
698 if (CommonTailLen > maxCommonTailLength) {
700 maxCommonTailLength = CommonTailLen;
701 HighestMPIter = CurMPIter;
702 SameTails.push_back(SameTailElt(CurMPIter, TrialBBI1));
704 if (HighestMPIter == CurMPIter &&
705 CommonTailLen == maxCommonTailLength)
706 SameTails.push_back(SameTailElt(
I, TrialBBI2));
712 return maxCommonTailLength;
715void BranchFolder::RemoveBlocksWithHash(
unsigned CurHash,
719 MPIterator CurMPIter,
B;
720 for (CurMPIter = std::prev(MergePotentials.end()),
721 B = MergePotentials.begin();
722 CurMPIter->getHash() == CurHash; --CurMPIter) {
725 if (SuccBB && CurMBB != PredBB)
726 FixTail(CurMBB, SuccBB, TII, BranchDL);
730 if (CurMPIter->getHash() != CurHash)
732 MergePotentials.erase(CurMPIter, MergePotentials.end());
737 unsigned maxCommonTailLength,
738 unsigned &commonTailIndex) {
740 unsigned TimeEstimate = ~0
U;
741 for (
unsigned i = 0, e = SameTails.size(); i != e; ++i) {
743 if (SameTails[i].getBlock() == PredBB) {
750 SameTails[i].getTailStartPos());
751 if (t <= TimeEstimate) {
758 SameTails[commonTailIndex].getTailStartPos();
762 << maxCommonTailLength);
775 SameTails[commonTailIndex].setBlock(newMBB);
776 SameTails[commonTailIndex].setTailStartPos(newMBB->
begin());
792 unsigned CommonTailLen = 0;
793 for (
auto E =
MBB->
end(); MBBIStartPos != E; ++MBBIStartPos)
801 while (CommonTailLen--) {
802 assert(
MBBI != MBBIE &&
"Reached BB end within common tail length!");
813 assert(MBBICommon != MBBIECommon &&
814 "Reached BB end within common tail length!");
815 assert(MBBICommon->isIdenticalTo(*
MBBI) &&
"Expected matching MIIs!");
818 if (MBBICommon->mayLoadOrStore())
819 MBBICommon->cloneMergedMemRefs(*
MBB->
getParent(), {&*MBBICommon, &*MBBI});
821 for (
unsigned I = 0, E = MBBICommon->getNumOperands();
I != E; ++
I) {
835void BranchFolder::mergeCommonTails(
unsigned commonTailIndex) {
838 std::vector<MachineBasicBlock::iterator> NextCommonInsts(SameTails.size());
839 for (
unsigned int i = 0 ; i != SameTails.size() ; ++i) {
840 if (i != commonTailIndex) {
841 NextCommonInsts[i] = SameTails[i].getTailStartPos();
845 "MBB is not a common tail only block");
849 for (
auto &
MI : *
MBB) {
853 for (
unsigned int i = 0 ; i < NextCommonInsts.size() ; i++) {
854 if (i == commonTailIndex)
857 auto &Pos = NextCommonInsts[i];
858 assert(Pos != SameTails[i].getBlock()->
end() &&
859 "Reached BB end within common tail");
862 assert(Pos != SameTails[i].getBlock()->
end() &&
863 "Reached BB end within common tail");
865 assert(
MI.isIdenticalTo(*Pos) &&
"Expected matching MIIs!");
867 NextCommonInsts[i] = ++Pos;
881 LiveRegs.addLiveOuts(*Pred);
884 if (!LiveRegs.available(*MRI, Reg))
890 return NewLiveIns.contains(SReg) && !MRI->isReserved(SReg);
895 BuildMI(*Pred, InsertBefore,
DL, TII->
get(TargetOpcode::IMPLICIT_DEF),
916 unsigned MinCommonTailLength) {
917 bool MadeChange =
false;
920 dbgs() <<
"\nTryTailMergeBlocks: ";
921 for (
unsigned i = 0, e = MergePotentials.size(); i != e; ++i)
923 << (i ==
e - 1 ?
"" :
", ");
931 dbgs() <<
"Looking for common tails of at least " << MinCommonTailLength
932 <<
" instruction" << (MinCommonTailLength == 1 ?
"" :
"s") <<
'\n';
937#if LLVM_ENABLE_DEBUGLOC_TRACKING_ORIGIN
940 std::sort(MergePotentials.begin(), MergePotentials.end());
946 while (MergePotentials.size() > 1) {
947 unsigned CurHash = MergePotentials.back().getHash();
948 const DebugLoc &BranchDL = MergePotentials.back().getBranchDebugLoc();
952 unsigned maxCommonTailLength = ComputeSameTails(CurHash,
958 if (SameTails.empty()) {
959 RemoveBlocksWithHash(CurHash, SuccBB, PredBB, BranchDL);
968 &MergePotentials.front().getBlock()->getParent()->front();
969 unsigned commonTailIndex = SameTails.size();
972 if (SameTails.size() == 2 &&
973 SameTails[0].getBlock()->isLayoutSuccessor(SameTails[1].getBlock()) &&
974 SameTails[1].tailIsWholeBlock() && !SameTails[1].getBlock()->isEHPad())
976 else if (SameTails.size() == 2 &&
977 SameTails[1].getBlock()->isLayoutSuccessor(
978 SameTails[0].getBlock()) &&
979 SameTails[0].tailIsWholeBlock() &&
980 !SameTails[0].getBlock()->isEHPad())
985 for (
unsigned i = 0, e = SameTails.size(); i != e; ++i) {
988 SameTails[i].tailIsWholeBlock())
994 if (SameTails[i].tailIsWholeBlock())
999 if (commonTailIndex == SameTails.size() ||
1000 (SameTails[commonTailIndex].getBlock() == PredBB &&
1001 !SameTails[commonTailIndex].tailIsWholeBlock())) {
1004 if (!CreateCommonTailOnlyBlock(PredBB, SuccBB,
1005 maxCommonTailLength, commonTailIndex)) {
1006 RemoveBlocksWithHash(CurHash, SuccBB, PredBB, BranchDL);
1014 setCommonTailEdgeWeights(*
MBB);
1018 mergeCommonTails(commonTailIndex);
1024 for (
unsigned int i=0, e = SameTails.size(); i != e; ++i) {
1025 if (commonTailIndex == i)
1028 << (i == e - 1 ?
"" :
", "));
1030 replaceTailWithBranchTo(SameTails[i].getTailStartPos(), *
MBB);
1032 MergePotentials.erase(SameTails[i].getMPIter());
1043 bool MadeChange =
false;
1044 if (!EnableTailMerge)
1049 MergePotentials.clear();
1061 for (
const MergePotentialsElt &Elt : MergePotentials)
1062 TriedMerging.insert(Elt.getBlock());
1065 if (MergePotentials.size() >= 2)
1066 MadeChange |= TryTailMergeBlocks(
nullptr,
nullptr, MinCommonTailLength);
1089 if (
I->pred_size() < 2)
continue;
1093 MergePotentials.clear();
1106 if (AfterBlockPlacement && MLI) {
1108 if (
ML && IBB ==
ML->getHeader())
1116 if (TriedMerging.count(PBB))
1124 if (!UniquePreds.
insert(PBB).second)
1129 if (PBB->hasEHPadSuccessor() || PBB->mayHaveInlineAsmBr())
1135 if (AfterBlockPlacement && MLI)
1145 if (!
Cond.empty() &&
TBB == IBB) {
1150 auto Next = ++PBB->getIterator();
1151 if (Next != MF.end())
1157 DebugLoc dl = PBB->findBranchDebugLoc();
1158 if (
TBB && (
Cond.empty() || FBB)) {
1166 MergePotentials.push_back(
1174 for (MergePotentialsElt &Elt : MergePotentials)
1175 TriedMerging.insert(Elt.getBlock());
1177 if (MergePotentials.size() >= 2)
1178 MadeChange |= TryTailMergeBlocks(IBB, PredBB, MinCommonTailLength);
1182 PredBB = &*std::prev(
I);
1183 if (MergePotentials.size() == 1 &&
1184 MergePotentials.begin()->getBlock() != PredBB)
1185 FixTail(MergePotentials.begin()->getBlock(), IBB, TII,
1186 MergePotentials.begin()->getBranchDebugLoc());
1199 for (
const auto &Src : SameTails) {
1202 AccumulatedMBBFreq += BlockFreq;
1209 auto EdgeFreq = EdgeFreqLs.begin();
1212 SuccI != SuccE; ++SuccI, ++EdgeFreq)
1216 MBBFreqInfo.
setBlockFreq(&TailMBB, AccumulatedMBBFreq);
1222 std::accumulate(EdgeFreqLs.begin(), EdgeFreqLs.end(),
BlockFrequency(0))
1224 auto EdgeFreq = EdgeFreqLs.begin();
1226 if (SumEdgeFreq > 0) {
1228 SuccI != SuccE; ++SuccI, ++EdgeFreq) {
1230 EdgeFreq->getFrequency(), SumEdgeFreq);
1241 bool MadeChange =
false;
1250 MadeChange |= OptimizeBlock(&
MBB);
1254 RemoveDeadBlock(&
MBB);
1274 return I->isBranch();
1283 assert(MBB1 && MBB2 &&
"Unknown MachineBasicBlock");
1291 if (MBB1I == MBB1->
end() || MBB2I == MBB2->
end())
1299 return MBB2I->isCall() && !MBB1I->isCall();
1307 if (
MI.isDebugInstr()) {
1308 TII->duplicate(PredMBB, InsertBefore,
MI);
1309 LLVM_DEBUG(
dbgs() <<
"Copied debug entity from empty block to pred: "
1319 if (
MI.isDebugInstr()) {
1320 TII->duplicate(SuccMBB, InsertBefore,
MI);
1321 LLVM_DEBUG(
dbgs() <<
"Copied debug entity from empty block to succ: "
1350 bool MadeChange =
false;
1358 bool SameEHScope =
true;
1359 if (!EHScopeMembership.empty() && FallThrough != MF.
end()) {
1360 auto MBBEHScope = EHScopeMembership.find(
MBB);
1361 assert(MBBEHScope != EHScopeMembership.end());
1362 auto FallThroughEHScope = EHScopeMembership.find(&*FallThrough);
1363 assert(FallThroughEHScope != EHScopeMembership.end());
1364 SameEHScope = MBBEHScope->second == FallThroughEHScope->second;
1371 bool CurUnAnalyzable =
1384 if (FallThrough == MF.
end()) {
1386 }
else if (FallThrough->isEHPad()) {
1402 if (*SI != &*FallThrough && !FallThrough->isSuccessor(*SI)) {
1403 assert((*SI)->isEHPad() &&
"Bad CFG");
1404 FallThrough->copySuccessor(
MBB, SI);
1409 MJTI->ReplaceMBBInJumpTables(
MBB, &*FallThrough);
1421 bool PriorUnAnalyzable =
1422 TII->
analyzeBranch(PrevBB, PriorTBB, PriorFBB, PriorCond,
true);
1423 if (!PriorUnAnalyzable) {
1427 if (PriorTBB && PriorTBB == PriorFBB) {
1431 if (PriorTBB !=
MBB)
1432 TII->
insertBranch(PrevBB, PriorTBB,
nullptr, PriorCond, Dl);
1435 goto ReoptimizeBlock;
1449 <<
"From MBB: " << *
MBB);
1451 if (!PrevBB.
empty()) {
1457 while (PrevBBIter != PrevBB.
begin() && MBBIter !=
MBB->
end()
1458 && PrevBBIter->isDebugInstr() && MBBIter->isDebugInstr()) {
1459 if (!MBBIter->isIdenticalTo(*PrevBBIter))
1462 ++MBBIter; -- PrevBBIter;
1476 if (PriorTBB ==
MBB && !PriorFBB) {
1480 goto ReoptimizeBlock;
1485 if (PriorFBB ==
MBB) {
1488 TII->
insertBranch(PrevBB, PriorTBB,
nullptr, PriorCond, Dl);
1491 goto ReoptimizeBlock;
1497 if (PriorTBB ==
MBB) {
1502 TII->
insertBranch(PrevBB, PriorFBB,
nullptr, NewPriorCond, Dl);
1505 goto ReoptimizeBlock;
1520 bool DoTransform =
true;
1527 if (FallThrough == --MF.
end() &&
1529 DoTransform =
false;
1536 <<
"To make fallthrough to: " << *PriorTBB <<
"\n");
1559 bool PredAnalyzable =
1560 !TII->
analyzeBranch(*Pred, PredTBB, PredFBB, PredCond,
true);
1563 if (PredAnalyzable && !PredCond.
empty() && PredTBB ==
MBB &&
1564 PredTBB != PredFBB) {
1582 if (!PredsChanged.
empty()) {
1583 NumTailCalls += PredsChanged.
size();
1584 for (
auto &Pred : PredsChanged)
1592 if (!CurUnAnalyzable) {
1598 if (CurTBB && CurFBB && CurFBB ==
MBB && CurTBB !=
MBB) {
1606 goto ReoptimizeBlock;
1612 if (CurTBB && CurCond.
empty() && !CurFBB &&
1635 if (PredHasNoFallThrough || !PriorUnAnalyzable ||
1640 PriorTBB !=
MBB && PriorFBB !=
MBB) {
1643 "Bad branch analysis");
1646 assert(!PriorFBB &&
"Machine CFG out of date!");
1651 TII->
insertBranch(PrevBB, PriorTBB, PriorFBB, PriorCond, PrevDl);
1656 bool DidChange =
false;
1657 bool HasBranchToSelf =
false;
1663 HasBranchToSelf =
true;
1673 assert((*SI)->isEHPad() &&
"Bad CFG");
1682 *PMBB, NewCurTBB, NewCurFBB, NewCurCond,
true);
1683 if (!NewCurUnAnalyzable && NewCurTBB && NewCurTBB == NewCurFBB) {
1687 TII->
insertBranch(*PMBB, NewCurTBB,
nullptr, NewCurCond,
1697 MJTI->ReplaceMBBInJumpTables(
MBB, CurTBB);
1701 if (!HasBranchToSelf)
return MadeChange;
1728 !TII->
analyzeBranch(*PredBB, PredTBB, PredFBB, PredCond,
true) &&
1729 (PredTBB ==
MBB || PredFBB ==
MBB) &&
1730 (!CurFallsThru || !CurTBB || !CurFBB) &&
1749 goto ReoptimizeBlock;
1754 if (!CurFallsThru) {
1757 if (!CurUnAnalyzable) {
1767 if (SuccBB !=
MBB && &*SuccPrev !=
MBB &&
1768 !SuccPrev->canFallThrough()) {
1771 goto ReoptimizeBlock;
1800 if (FallThrough != MF.
end() && !FallThrough->isEHPad() &&
1801 !FallThrough->isInlineAsmBrIndirectTarget() &&
1802 !TII->
analyzeBranch(PrevBB, PrevTBB, PrevFBB, PrevCond,
true) &&
1819 bool MadeChange =
false;
1821 MadeChange |= HoistCommonCodeInSuccs(&
MBB);
1831 if (SuccBB != TrueBB)
1836template <
class Container>
1839 if (Reg.isPhysical()) {
1861 if (!
TII->isUnpredicatedTerminator(*Loc))
1902 if (!MO.isReg() || MO.isUse())
1907 if (
Uses.count(Reg)) {
1923 bool DontMoveAcrossStore =
true;
1938 if (
Uses.erase(Reg)) {
1939 if (Reg.isPhysical()) {
1976 bool HasDups =
false;
1982 while (TIB != TIE && FIB != FIE) {
1986 if (TIB == TIE || FIB == FIE)
1999 if (MO.isRegMask()) {
2009 if (
Uses.count(Reg)) {
2016 if (Defs.
count(Reg) && !MO.isDead()) {
2031 }
else if (!ActiveDefsSet.
count(Reg)) {
2032 if (Defs.
count(Reg)) {
2038 if (MO.isKill() &&
Uses.count(Reg))
2041 MO.setIsKill(
false);
2047 bool DontMoveAcrossStore =
true;
2048 if (!TIB->isSafeToMove(DontMoveAcrossStore))
2058 if (!AllDefsSet.
count(Reg)) {
2061 if (
Reg.isPhysical()) {
2063 ActiveDefsSet.
erase(*AI);
2065 ActiveDefsSet.
erase(Reg);
2074 if (!Reg ||
Reg.isVirtual())
2099 assert(DI->isDebugInstr() &&
"Expected a debug instruction");
2100 if (DI->isDebugRef()) {
2105 DI->getDebugVariable(), DI->getDebugExpression());
2110 if (DI->isDebugPHI()) {
2111 DI->eraseFromParent();
2115 if (!DI->isDebugLabel())
2116 DI->setDebugValueUndef();
2117 DI->moveBefore(&*Loc);
2129 while (FI != FE && FI->isDebugInstr())
2130 HoistAndKillDbgInstr(FI++);
2133 if (TI->isDebugInstr()) {
2134 HoistAndKillDbgInstr(TI);
2139 assert(FI != FE &&
"Unexpected end of FBB range");
2142 assert(!TI->isPseudoProbe() &&
"Unexpected pseudo probe in range");
2146 "Expected non-debug lockstep");
2151 TI->moveBefore(&*Loc);
2156 FBB->erase(FBB->begin(), FIB);
unsigned const MachineRegisterInfo * MRI
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
This file implements the BitVector class.
static unsigned EstimateRuntime(MachineBasicBlock::iterator I, MachineBasicBlock::iterator E)
EstimateRuntime - Make a rough estimate for how long it will take to run the specified code.
static unsigned ComputeCommonTailLength(MachineBasicBlock *MBB1, MachineBasicBlock *MBB2, MachineBasicBlock::iterator &I1, MachineBasicBlock::iterator &I2)
Given two machine basic blocks, return the number of instructions they actually have in common togeth...
static MachineBasicBlock * findFalseBlock(MachineBasicBlock *BB, MachineBasicBlock *TrueBB)
findFalseBlock - BB has a fallthrough.
static void copyDebugInfoToPredecessor(const TargetInstrInfo *TII, MachineBasicBlock &MBB, MachineBasicBlock &PredMBB)
static unsigned HashMachineInstr(const MachineInstr &MI)
HashMachineInstr - Compute a hash value for MI and its operands.
static bool countsAsInstruction(const MachineInstr &MI)
Whether MI should be counted as an instruction when calculating common tail.
static unsigned CountTerminators(MachineBasicBlock *MBB, MachineBasicBlock::iterator &I)
CountTerminators - Count the number of terminators in the given block and set I to the position of th...
static bool blockEndsInUnreachable(const MachineBasicBlock *MBB)
A no successor, non-return block probably ends in unreachable and is cold.
static void salvageDebugInfoFromEmptyBlock(const TargetInstrInfo *TII, MachineBasicBlock &MBB)
static MachineBasicBlock::iterator skipBackwardPastNonInstructions(MachineBasicBlock::iterator I, MachineBasicBlock *MBB)
Iterate backwards from the given iterator I, towards the beginning of the block.
static cl::opt< unsigned > TailMergeThreshold("tail-merge-threshold", cl::desc("Max number of predecessors to consider tail merging"), cl::init(150), cl::Hidden)
static void addRegAndItsAliases(Register Reg, const TargetRegisterInfo *TRI, Container &Set)
static cl::opt< cl::boolOrDefault > FlagEnableTailMerge("enable-tail-merge", cl::init(cl::BOU_UNSET), cl::Hidden)
static cl::opt< unsigned > TailMergeSize("tail-merge-size", cl::desc("Min number of instructions to consider tail merging"), cl::init(3), cl::Hidden)
static bool IsEmptyBlock(MachineBasicBlock *MBB)
static bool ProfitableToMerge(MachineBasicBlock *MBB1, MachineBasicBlock *MBB2, unsigned MinCommonTailLength, unsigned &CommonTailLen, MachineBasicBlock::iterator &I1, MachineBasicBlock::iterator &I2, MachineBasicBlock *SuccBB, MachineBasicBlock *PredBB, DenseMap< const MachineBasicBlock *, int > &EHScopeMembership, bool AfterPlacement, MBFIWrapper &MBBFreqInfo, ProfileSummaryInfo *PSI)
ProfitableToMerge - Check if two machine basic blocks have a common tail and decide if it would be pr...
static void copyDebugInfoToSuccessor(const TargetInstrInfo *TII, MachineBasicBlock &MBB, MachineBasicBlock &SuccMBB)
static bool IsBranchOnlyBlock(MachineBasicBlock *MBB)
static void FixTail(MachineBasicBlock *CurMBB, MachineBasicBlock *SuccBB, const TargetInstrInfo *TII, const DebugLoc &BranchDL)
static bool IsBetterFallthrough(MachineBasicBlock *MBB1, MachineBasicBlock *MBB2)
IsBetterFallthrough - Return true if it would be clearly better to fall-through to MBB1 than to fall ...
static unsigned HashEndOfMBB(const MachineBasicBlock &MBB)
HashEndOfMBB - Hash the last instruction in the MBB.
static void mergeOperations(MachineBasicBlock::iterator MBBIStartPos, MachineBasicBlock &MBBCommon)
static MachineBasicBlock::iterator findHoistingInsertPosAndDeps(MachineBasicBlock *MBB, const TargetInstrInfo *TII, const TargetRegisterInfo *TRI, SmallSet< Register, 4 > &Uses, SmallSet< Register, 4 > &Defs)
findHoistingInsertPosAndDeps - Find the location to move common instructions in successors to.
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
const HexagonInstrInfo * TII
A common definition of LaneBitmask for use in TableGen and CodeGen.
Register const TargetRegisterInfo * TRI
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
Remove Loads Into Fake Uses
This file defines the SmallSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Target-Independent Code Generator Pass Configuration Options pass.
A container for analyses that lazily runs them and caches their results.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
LLVM Basic Block Representation.
bool test(unsigned Idx) const
size_type size() const
size - Returns the number of bits in this bitvector.
bool OptimizeFunction(MachineFunction &MF, const TargetInstrInfo *tii, const TargetRegisterInfo *tri, MachineLoopInfo *mli=nullptr, bool AfterPlacement=false)
Perhaps branch folding, tail merging and other CFG optimizations on the given function.
BranchFolder(bool DefaultEnableTailMerge, bool CommonHoist, MBFIWrapper &FreqInfo, const MachineBranchProbabilityInfo &ProbInfo, ProfileSummaryInfo *PSI, unsigned MinTailLength=0)
static LLVM_ABI BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
static LLVM_ABI DILocation * getMergedLocation(DILocation *LocA, DILocation *LocB)
Attempts to merge LocA and LocB into a single location; see DebugLoc::getMergedLocation for more deta...
This class represents an Operation in the Expression.
static LLVM_ABI DebugLoc getMergedLocation(DebugLoc LocA, DebugLoc LocB)
When two instructions are combined into a single instruction we also need to combine the original loc...
iterator find(const_arg_type_t< KeyT > Val)
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
Remove the branching code at the end of the specific MBB.
bool isPredicated(const MachineInstr &MI) const override
Returns true if the instruction is already predicated.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
Analyze the branching code at the end of MBB, returning true if it cannot be understood (e....
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
Reverses the branch condition of the specified condition list, returning false on success and true if...
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
Insert branch code into the end of the specified MachineBasicBlock.
A set of physical registers with utility functions to track liveness when walking backward/forward th...
void removeBlock(BlockT *BB)
This method completely removes BB from all data structures, including all of the Loop objects it is n...
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
BlockFrequency getBlockFreq(const MachineBasicBlock *MBB) const
void setBlockFreq(const MachineBasicBlock *MBB, BlockFrequency F)
Describe properties that are true of each instruction in the target description file.
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
MCRegAliasIterator enumerates all registers aliasing Reg.
iterator_range< MCSuperRegIterator > superregs(MCRegister Reg) const
Return an iterator range over all super-registers of Reg, excluding Reg.
Wrapper class representing physical registers. Should be passed by value.
An RAII based helper class to modify MachineFunctionProperties when running pass.
unsigned pred_size() const
bool isEHPad() const
Returns true if the block is a landing pad.
LLVM_ABI void moveBefore(MachineBasicBlock *NewAfter)
Move 'this' block before or after the specified block.
LLVM_ABI void transferSuccessors(MachineBasicBlock *FromMBB)
Transfers all the successors from MBB to this machine basic block (i.e., copies all the successors Fr...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
iterator_range< livein_iterator > liveins() const
int getNumber() const
MachineBasicBlocks are uniquely numbered at the function level, unless they're not in a MachineFuncti...
LLVM_ABI iterator SkipPHIsAndLabels(iterator I)
Return the first instruction in MBB after I that is not a PHI or a label.
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
LLVM_ABI bool canFallThrough()
Return true if the block can implicitly transfer control to the block after it by falling off the end...
LLVM_ABI void setSuccProbability(succ_iterator I, BranchProbability Prob)
Set successor probability of a given iterator.
LLVM_ABI iterator getFirstNonDebugInstr(bool SkipPseudoOp=true)
Returns an iterator to the first non-debug instruction in the basic block, or end().
succ_iterator succ_begin()
LLVM_ABI void clearLiveIns()
Clear live in list.
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
unsigned succ_size() const
bool hasAddressTaken() const
Test whether this block is used as something other than the target of a terminator,...
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
LLVM_ABI void copySuccessor(const MachineBasicBlock *Orig, succ_iterator I)
Copy a successor (and any probability info) from original block to this block's.
LLVM_ABI void removeSuccessor(MachineBasicBlock *Succ, bool NormalizeSuccProbs=false)
Remove successor from the successors list of this MachineBasicBlock.
pred_iterator pred_begin()
LLVM_ABI iterator getLastNonDebugInstr(bool SkipPseudoOp=true)
Returns an iterator to the last non-debug instruction in the basic block, or end().
LLVM_ABI void ReplaceUsesOfBlockWith(MachineBasicBlock *Old, MachineBasicBlock *New)
Given a machine basic block that branched to 'Old', change the code and CFG so that it branches to 'N...
LLVM_ABI bool isLayoutSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB will be emitted immediately after this block, such that if this bloc...
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
LLVM_ABI DebugLoc findBranchDebugLoc()
Find and return the merged DebugLoc of the branch instructions of the block.
iterator_range< succ_iterator > successors()
reverse_iterator rbegin()
bool isMachineBlockAddressTaken() const
Test whether this block is used as something other than the target of a terminator,...
LLVM_ABI bool isSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB is a successor of this block.
iterator_range< pred_iterator > predecessors()
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
LLVM_ABI void moveAfter(MachineBasicBlock *NewBefore)
BranchProbability getEdgeProbability(const MachineBasicBlock *Src, const MachineBasicBlock *Dst) const
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
virtual MachineFunctionProperties getRequiredProperties() const
Properties which a MachineFunction may have at a given point in time.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
const MachineBasicBlock & back() const
void eraseAdditionalCallInfo(const MachineInstr *MI)
Following functions update call site info.
void RenumberBlocks(MachineBasicBlock *MBBFrom=nullptr)
RenumberBlocks - This discards all of the MachineBasicBlock numbers and recomputes them.
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineBasicBlock - Allocate a new MachineBasicBlock.
void erase(iterator MBBI)
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Representation of each machine instruction.
bool isReturn(QueryType Type=AnyInBundle) const
bool isBarrier(QueryType Type=AnyInBundle) const
Returns true if the specified instruction stops control flow from executing the instruction immediate...
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
bool isIndirectBranch(QueryType Type=AnyInBundle) const
Return true if this is an indirect branch, such as a branch through a register.
void RemoveJumpTable(unsigned Idx)
RemoveJumpTable - Mark the specific index as being dead.
const std::vector< MachineJumpTableEntry > & getJumpTables() const
MachineOperand class - Representation of each machine instruction operand.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
void setIsUndef(bool Val=true)
@ MO_Immediate
Immediate operand.
@ MO_ConstantPoolIndex
Address of indexed Constant in Constant Pool.
@ MO_GlobalAddress
Address of a global value.
@ MO_MachineBasicBlock
MachineBasicBlock reference.
@ MO_FrameIndex
Abstract Stack Frame Index.
@ MO_Register
Register operand.
@ MO_ExternalSymbol
Name of external global symbol.
@ MO_JumpTableIndex
Address of indexed Jump Table for switch.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
An analysis over an "inner" IR unit that provides access to an analysis manager over an "outer" IR uni...
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
An analysis pass based on legacy pass manager to deliver ProfileSummaryInfo.
Analysis providing profile information.
Wrapper class representing virtual and physical registers.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
size_type count(const T &V) const
count - Return 1 if the element is in the set, 0 otherwise.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
TargetInstrInfo - Interface to description of machine instruction set.
virtual bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const
Reverses the branch condition of the specified condition list, returning false on success and true if...
virtual unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const
Remove the branching code at the end of the specific MBB.
virtual bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify=false) const
Analyze the branching code at the end of MBB, returning true if it cannot be understood (e....
virtual bool canMakeTailCallConditional(SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const
Returns true if the tail call can be made conditional on BranchCond.
virtual void ReplaceTailWithBranchTo(MachineBasicBlock::iterator Tail, MachineBasicBlock *NewDest) const
Delete the instruction Tail and everything after it, replacing it with an unconditional branch to ...
virtual bool isUnconditionalTailCall(const MachineInstr &MI) const
Returns true if MI is an unconditional tail call.
virtual unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const
Insert branch code into the end of the specified MachineBasicBlock.
virtual unsigned getTailMergeSize(const MachineFunction &MF) const
Returns the target-specific default value for tail merging.
virtual bool isPredicated(const MachineInstr &MI) const
Returns true if the instruction is already predicated.
virtual void replaceBranchWithTailCall(MachineBasicBlock &MBB, SmallVectorImpl< MachineOperand > &Cond, const MachineInstr &TailCall) const
Replace the conditional branch in MBB with a conditional tail call.
virtual bool isLegalToSplitMBBAt(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI) const
Return true if it's legal to split the given basic block at the specified instruction (i....
bool requiresStructuredCFG() const
Target-Independent Code Generator Pass Configuration Options.
bool getEnableTailMerge() const
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
virtual bool trackLivenessAfterRegAlloc(const MachineFunction &MF) const
Returns true if the live-ins should be tracked after register allocation.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
self_iterator getIterator()
unsigned ID
LLVM IR allows the use of arbitrary numbers as calling convention identifiers.
Reg
All possible values of the reg field in the ModR/M byte.
initializer< Ty > init(const Ty &Val)
LLVM_ABI const_iterator begin(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get begin iterator over path.
LLVM_ABI const_iterator end(StringRef path LLVM_LIFETIME_BOUND)
Get end iterator over path.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
LLVM_ABI bool shouldOptimizeForSize(const MachineFunction *MF, ProfileSummaryInfo *PSI, const MachineBlockFrequencyInfo *BFI, PGSOQueryType QueryType=PGSOQueryType::Other)
Returns true if machine function MF is suggested to be size-optimized based on the profile.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
IterT skipDebugInstructionsForward(IterT It, IterT End, bool SkipPseudoOp=true)
Increment It until it points to a non-debug instruction or to End and return the resulting iterator.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
void computeAndAddLiveIns(LivePhysRegs &LiveRegs, MachineBasicBlock &MBB)
Convenience function combining computeLiveIns() and addLiveIns().
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
void computeLiveIns(LivePhysRegs &LiveRegs, const MachineBasicBlock &MBB)
Computes registers live-in to MBB assuming all of its successors live-in lists are up-to-date.
LLVM_ABI char & BranchFolderPassID
BranchFolding - This pass performs machine code CFG based optimizations to delete branches to branche...
IterT prev_nodbg(IterT It, IterT Begin, bool SkipPseudoOp=true)
Decrement It, then continue decrementing it while it points to a debug instruction.
void fullyRecomputeLiveIns(ArrayRef< MachineBasicBlock * > MBBs)
Convenience function for recomputing live-ins for a set of MBBs until the computation converges.
LLVM_ABI Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
void addLiveIns(MachineBasicBlock &MBB, const LivePhysRegs &LiveRegs)
Adds registers contained in LiveRegs to the block live-in list of MBB.
DenseMap< const MachineBasicBlock *, int > getEHScopeMembership(const MachineFunction &MF)
static constexpr LaneBitmask getAll()
Pair of physical register and lane mask.