//===- BranchRelaxation.cpp -----------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "llvm/CodeGen/BranchRelaxation.h" #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/Statistic.h" #include "llvm/CodeGen/LivePhysRegs.h" #include "llvm/CodeGen/MachineBasicBlock.h" #include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/MachineInstr.h" #include "llvm/CodeGen/RegisterScavenging.h" #include "llvm/CodeGen/TargetInstrInfo.h" #include "llvm/CodeGen/TargetRegisterInfo.h" #include "llvm/CodeGen/TargetSubtargetInfo.h" #include "llvm/Config/llvm-config.h" #include "llvm/IR/DebugLoc.h" #include "llvm/InitializePasses.h" #include "llvm/Pass.h" #include "llvm/Support/Compiler.h" #include "llvm/Support/Debug.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Support/Format.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Target/TargetMachine.h" #include #include #include #include using namespace llvm; #define DEBUG_TYPE "branch-relaxation" STATISTIC(NumSplit, "Number of basic blocks split"); STATISTIC(NumConditionalRelaxed, "Number of conditional branches relaxed"); STATISTIC(NumUnconditionalRelaxed, "Number of unconditional branches relaxed"); #define BRANCH_RELAX_NAME "Branch relaxation pass" namespace { class BranchRelaxation { /// BasicBlockInfo - Information about the offset and size of a single /// basic block. struct BasicBlockInfo { /// Offset - Distance from the beginning of the function to the beginning /// of this basic block. /// /// The offset is always aligned as required by the basic block. unsigned Offset = 0; /// Size - Size of the basic block in bytes. If the block contains /// inline assembly, this is a worst case estimate. /// /// The size does not include any alignment padding whether from the /// beginning of the block, or from an aligned jump table at the end. unsigned Size = 0; BasicBlockInfo() = default; /// Compute the offset immediately following this block. \p MBB is the next /// block. unsigned postOffset(const MachineBasicBlock &MBB) const { const unsigned PO = Offset + Size; const Align Alignment = MBB.getAlignment(); const Align ParentAlign = MBB.getParent()->getAlignment(); if (Alignment <= ParentAlign) return alignTo(PO, Alignment); // The alignment of this MBB is larger than the function's alignment, so // we can't tell whether or not it will insert nops. Assume that it will. return alignTo(PO, Alignment) + Alignment.value() - ParentAlign.value(); } }; SmallVector BlockInfo; // The basic block after which trampolines are inserted. This is the last // basic block that isn't in the cold section. MachineBasicBlock *TrampolineInsertionPoint = nullptr; SmallDenseSet> RelaxedUnconditionals; std::unique_ptr RS; LivePhysRegs LiveRegs; MachineFunction *MF = nullptr; const TargetRegisterInfo *TRI = nullptr; const TargetInstrInfo *TII = nullptr; const TargetMachine *TM = nullptr; bool relaxBranchInstructions(); void scanFunction(); MachineBasicBlock *createNewBlockAfter(MachineBasicBlock &OrigMBB); MachineBasicBlock *createNewBlockAfter(MachineBasicBlock &OrigMBB, const BasicBlock *BB); MachineBasicBlock *splitBlockBeforeInstr(MachineInstr &MI, MachineBasicBlock *DestBB); void adjustBlockOffsets(MachineBasicBlock &Start); void adjustBlockOffsets(MachineBasicBlock &Start, MachineFunction::iterator End); bool isBlockInRange(const MachineInstr &MI, const MachineBasicBlock &BB) const; bool fixupConditionalBranch(MachineInstr &MI); bool fixupUnconditionalBranch(MachineInstr &MI); uint64_t computeBlockSize(const MachineBasicBlock &MBB) const; unsigned getInstrOffset(const MachineInstr &MI) const; void dumpBBs(); void verify(); public: bool run(MachineFunction &MF); }; class BranchRelaxationLegacy : public MachineFunctionPass { public: static char ID; BranchRelaxationLegacy() : MachineFunctionPass(ID) {} bool runOnMachineFunction(MachineFunction &MF) override { return BranchRelaxation().run(MF); } StringRef getPassName() const override { return BRANCH_RELAX_NAME; } }; } // end anonymous namespace char BranchRelaxationLegacy::ID = 0; char &llvm::BranchRelaxationPassID = BranchRelaxationLegacy::ID; INITIALIZE_PASS(BranchRelaxationLegacy, DEBUG_TYPE, BRANCH_RELAX_NAME, false, false) /// verify - check BBOffsets, BBSizes, alignment of islands void BranchRelaxation::verify() { #ifndef NDEBUG unsigned PrevNum = MF->begin()->getNumber(); for (MachineBasicBlock &MBB : *MF) { const unsigned Num = MBB.getNumber(); assert(!Num || BlockInfo[PrevNum].postOffset(MBB) <= BlockInfo[Num].Offset); assert(BlockInfo[Num].Size == computeBlockSize(MBB)); PrevNum = Num; } for (MachineBasicBlock &MBB : *MF) { for (MachineBasicBlock::iterator J = MBB.getFirstTerminator(); J != MBB.end(); J = std::next(J)) { MachineInstr &MI = *J; if (!MI.isConditionalBranch() && !MI.isUnconditionalBranch()) continue; if (MI.getOpcode() == TargetOpcode::FAULTING_OP) continue; MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI); assert(isBlockInRange(MI, *DestBB) || RelaxedUnconditionals.contains({&MBB, DestBB})); } } #endif } #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) /// print block size and offset information - debugging LLVM_DUMP_METHOD void BranchRelaxation::dumpBBs() { for (auto &MBB : *MF) { const BasicBlockInfo &BBI = BlockInfo[MBB.getNumber()]; dbgs() << format("%%bb.%u\toffset=%08x\t", MBB.getNumber(), BBI.Offset) << format("size=%#x\n", BBI.Size); } } #endif /// scanFunction - Do the initial scan of the function, building up /// information about each block. void BranchRelaxation::scanFunction() { BlockInfo.clear(); BlockInfo.resize(MF->getNumBlockIDs()); TrampolineInsertionPoint = nullptr; RelaxedUnconditionals.clear(); // First thing, compute the size of all basic blocks, and see if the function // has any inline assembly in it. If so, we have to be conservative about // alignment assumptions, as we don't know for sure the size of any // instructions in the inline assembly. At the same time, place the // trampoline insertion point at the end of the hot portion of the function. for (MachineBasicBlock &MBB : *MF) { BlockInfo[MBB.getNumber()].Size = computeBlockSize(MBB); if (MBB.getSectionID() != MBBSectionID::ColdSectionID) TrampolineInsertionPoint = &MBB; } // Compute block offsets and known bits. adjustBlockOffsets(*MF->begin()); if (TrampolineInsertionPoint == nullptr) { LLVM_DEBUG(dbgs() << " No suitable trampoline insertion point found in " << MF->getName() << ".\n"); } } /// computeBlockSize - Compute the size for MBB. uint64_t BranchRelaxation::computeBlockSize(const MachineBasicBlock &MBB) const { uint64_t Size = 0; for (const MachineInstr &MI : MBB) Size += TII->getInstSizeInBytes(MI); return Size; } /// getInstrOffset - Return the current offset of the specified machine /// instruction from the start of the function. This offset changes as stuff is /// moved around inside the function. unsigned BranchRelaxation::getInstrOffset(const MachineInstr &MI) const { const MachineBasicBlock *MBB = MI.getParent(); // The offset is composed of two things: the sum of the sizes of all MBB's // before this instruction's block, and the offset from the start of the block // it is in. unsigned Offset = BlockInfo[MBB->getNumber()].Offset; // Sum instructions before MI in MBB. for (MachineBasicBlock::const_iterator I = MBB->begin(); &*I != &MI; ++I) { assert(I != MBB->end() && "Didn't find MI in its own basic block?"); Offset += TII->getInstSizeInBytes(*I); } return Offset; } void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock &Start) { adjustBlockOffsets(Start, MF->end()); } void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock &Start, MachineFunction::iterator End) { unsigned PrevNum = Start.getNumber(); for (auto &MBB : make_range(std::next(MachineFunction::iterator(Start)), End)) { unsigned Num = MBB.getNumber(); // Get the offset and known bits at the end of the layout predecessor. // Include the alignment of the current block. BlockInfo[Num].Offset = BlockInfo[PrevNum].postOffset(MBB); PrevNum = Num; } } /// Insert a new empty MachineBasicBlock and insert it after \p OrigMBB MachineBasicBlock * BranchRelaxation::createNewBlockAfter(MachineBasicBlock &OrigBB) { return createNewBlockAfter(OrigBB, OrigBB.getBasicBlock()); } /// Insert a new empty MachineBasicBlock with \p BB as its BasicBlock /// and insert it after \p OrigMBB MachineBasicBlock * BranchRelaxation::createNewBlockAfter(MachineBasicBlock &OrigMBB, const BasicBlock *BB) { // Create a new MBB for the code after the OrigBB. MachineBasicBlock *NewBB = MF->CreateMachineBasicBlock(BB); MF->insert(++OrigMBB.getIterator(), NewBB); // Place the new block in the same section as OrigBB NewBB->setSectionID(OrigMBB.getSectionID()); NewBB->setIsEndSection(OrigMBB.isEndSection()); OrigMBB.setIsEndSection(false); // Insert an entry into BlockInfo to align it properly with the block numbers. BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo()); return NewBB; } /// Split the basic block containing MI into two blocks, which are joined by /// an unconditional branch. Update data structures and renumber blocks to /// account for this change and returns the newly created block. MachineBasicBlock * BranchRelaxation::splitBlockBeforeInstr(MachineInstr &MI, MachineBasicBlock *DestBB) { MachineBasicBlock *OrigBB = MI.getParent(); // Create a new MBB for the code after the OrigBB. MachineBasicBlock *NewBB = MF->CreateMachineBasicBlock(OrigBB->getBasicBlock()); MF->insert(++OrigBB->getIterator(), NewBB); // Place the new block in the same section as OrigBB. NewBB->setSectionID(OrigBB->getSectionID()); NewBB->setIsEndSection(OrigBB->isEndSection()); OrigBB->setIsEndSection(false); // Splice the instructions starting with MI over to NewBB. NewBB->splice(NewBB->end(), OrigBB, MI.getIterator(), OrigBB->end()); // Add an unconditional branch from OrigBB to NewBB. // Note the new unconditional branch is not being recorded. // There doesn't seem to be meaningful DebugInfo available; this doesn't // correspond to anything in the source. TII->insertUnconditionalBranch(*OrigBB, NewBB, DebugLoc()); // Insert an entry into BlockInfo to align it properly with the block numbers. BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo()); NewBB->transferSuccessors(OrigBB); OrigBB->addSuccessor(NewBB); OrigBB->addSuccessor(DestBB); // Cleanup potential unconditional branch to successor block. // Note that updateTerminator may change the size of the blocks. OrigBB->updateTerminator(NewBB); // Figure out how large the OrigBB is. As the first half of the original // block, it cannot contain a tablejump. The size includes // the new jump we added. (It should be possible to do this without // recounting everything, but it's very confusing, and this is rarely // executed.) BlockInfo[OrigBB->getNumber()].Size = computeBlockSize(*OrigBB); // Figure out how large the NewMBB is. As the second half of the original // block, it may contain a tablejump. BlockInfo[NewBB->getNumber()].Size = computeBlockSize(*NewBB); // Update the offset of the new block. adjustBlockOffsets(*OrigBB, std::next(NewBB->getIterator())); // Need to fix live-in lists if we track liveness. if (TRI->trackLivenessAfterRegAlloc(*MF)) computeAndAddLiveIns(LiveRegs, *NewBB); ++NumSplit; return NewBB; } /// isBlockInRange - Returns true if the distance between specific MI and /// specific BB can fit in MI's displacement field. bool BranchRelaxation::isBlockInRange(const MachineInstr &MI, const MachineBasicBlock &DestBB) const { int64_t BrOffset = getInstrOffset(MI); int64_t DestOffset = BlockInfo[DestBB.getNumber()].Offset; const MachineBasicBlock *SrcBB = MI.getParent(); if (TII->isBranchOffsetInRange(MI.getOpcode(), SrcBB->getSectionID() != DestBB.getSectionID() ? TM->getMaxCodeSize() : DestOffset - BrOffset)) return true; LLVM_DEBUG(dbgs() << "Out of range branch to destination " << printMBBReference(DestBB) << " from " << printMBBReference(*MI.getParent()) << " to " << DestOffset << " offset " << DestOffset - BrOffset << '\t' << MI); return false; } /// fixupConditionalBranch - Fix up a conditional branch whose destination is /// too far away to fit in its displacement field. It is converted to an inverse /// conditional branch + an unconditional branch to the destination. bool BranchRelaxation::fixupConditionalBranch(MachineInstr &MI) { DebugLoc DL = MI.getDebugLoc(); MachineBasicBlock *MBB = MI.getParent(); MachineBasicBlock *TBB = nullptr, *FBB = nullptr; MachineBasicBlock *NewBB = nullptr; SmallVector Cond; auto insertUncondBranch = [&](MachineBasicBlock *MBB, MachineBasicBlock *DestBB) { unsigned &BBSize = BlockInfo[MBB->getNumber()].Size; int NewBrSize = 0; TII->insertUnconditionalBranch(*MBB, DestBB, DL, &NewBrSize); BBSize += NewBrSize; }; auto insertBranch = [&](MachineBasicBlock *MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, SmallVectorImpl &Cond) { unsigned &BBSize = BlockInfo[MBB->getNumber()].Size; int NewBrSize = 0; TII->insertBranch(*MBB, TBB, FBB, Cond, DL, &NewBrSize); BBSize += NewBrSize; }; auto removeBranch = [&](MachineBasicBlock *MBB) { unsigned &BBSize = BlockInfo[MBB->getNumber()].Size; int RemovedSize = 0; TII->removeBranch(*MBB, &RemovedSize); BBSize -= RemovedSize; }; // Populate the block offset and live-ins for a new basic block. auto updateOffsetAndLiveness = [&](MachineBasicBlock *NewBB) { assert(NewBB != nullptr && "can't populate offset for nullptr"); // Keep the block offsets approximately up to date. While they will be // slight underestimates, we will update them appropriately in the next // scan through the function. adjustBlockOffsets(*std::prev(NewBB->getIterator()), std::next(NewBB->getIterator())); // Need to fix live-in lists if we track liveness. if (TRI->trackLivenessAfterRegAlloc(*MF)) computeAndAddLiveIns(LiveRegs, *NewBB); }; bool Fail = TII->analyzeBranch(*MBB, TBB, FBB, Cond); assert(!Fail && "branches to be relaxed must be analyzable"); (void)Fail; // Since cross-section conditional branches to the cold section are rarely // taken, try to avoid inverting the condition. Instead, add a "trampoline // branch", which unconditionally branches to the branch destination. Place // the trampoline branch at the end of the function and retarget the // conditional branch to the trampoline. // tbz L1 // => // tbz L1Trampoline // ... // L1Trampoline: b L1 if (MBB->getSectionID() != TBB->getSectionID() && TBB->getSectionID() == MBBSectionID::ColdSectionID && TrampolineInsertionPoint != nullptr) { // If the insertion point is out of range, we can't put a trampoline there. NewBB = createNewBlockAfter(*TrampolineInsertionPoint, MBB->getBasicBlock()); if (isBlockInRange(MI, *NewBB)) { LLVM_DEBUG(dbgs() << " Retarget destination to trampoline at " << NewBB->back()); insertUncondBranch(NewBB, TBB); // Update the successor lists to include the trampoline. MBB->replaceSuccessor(TBB, NewBB); NewBB->addSuccessor(TBB); // Replace branch in the current (MBB) block. removeBranch(MBB); insertBranch(MBB, NewBB, FBB, Cond); TrampolineInsertionPoint = NewBB; updateOffsetAndLiveness(NewBB); return true; } LLVM_DEBUG( dbgs() << " Trampoline insertion point out of range for Bcc from " << printMBBReference(*MBB) << " to " << printMBBReference(*TBB) << ".\n"); TrampolineInsertionPoint->setIsEndSection(NewBB->isEndSection()); MF->erase(NewBB); NewBB = nullptr; } // Add an unconditional branch to the destination and invert the branch // condition to jump over it: // tbz L1 // => // tbnz L2 // b L1 // L2: bool ReversedCond = !TII->reverseBranchCondition(Cond); if (ReversedCond) { if (FBB && isBlockInRange(MI, *FBB)) { // Last MI in the BB is an unconditional branch. We can simply invert the // condition and swap destinations: // beq L1 // b L2 // => // bne L2 // b L1 LLVM_DEBUG(dbgs() << " Invert condition and swap " "its destination with " << MBB->back()); removeBranch(MBB); insertBranch(MBB, FBB, TBB, Cond); return true; } if (FBB) { // If we get here with a MBB which ends like this: // // bb.1: // successors: %bb.2; // ... // BNE $x1, $x0, %bb.2 // PseudoBR %bb.2 // // Just remove conditional branch. if (TBB == FBB) { removeBranch(MBB); insertUncondBranch(MBB, TBB); return true; } // We need to split the basic block here to obtain two long-range // unconditional branches. NewBB = createNewBlockAfter(*MBB); insertUncondBranch(NewBB, FBB); // Update the succesor lists according to the transformation to follow. // Do it here since if there's no split, no update is needed. MBB->replaceSuccessor(FBB, NewBB); NewBB->addSuccessor(FBB); updateOffsetAndLiveness(NewBB); } // We now have an appropriate fall-through block in place (either naturally // or just created), so we can use the inverted the condition. MachineBasicBlock &NextBB = *std::next(MachineFunction::iterator(MBB)); LLVM_DEBUG(dbgs() << " Insert B to " << printMBBReference(*TBB) << ", invert condition and change dest. to " << printMBBReference(NextBB) << '\n'); removeBranch(MBB); // Insert a new conditional branch and a new unconditional branch. insertBranch(MBB, &NextBB, TBB, Cond); return true; } // Branch cond can't be inverted. // In this case we always add a block after the MBB. LLVM_DEBUG(dbgs() << " The branch condition can't be inverted. " << " Insert a new BB after " << MBB->back()); if (!FBB) FBB = &(*std::next(MachineFunction::iterator(MBB))); // This is the block with cond. branch and the distance to TBB is too long. // beq L1 // L2: // We do the following transformation: // beq NewBB // b L2 // NewBB: // b L1 // L2: NewBB = createNewBlockAfter(*MBB); insertUncondBranch(NewBB, TBB); LLVM_DEBUG(dbgs() << " Insert cond B to the new BB " << printMBBReference(*NewBB) << " Keep the exiting condition.\n" << " Insert B to " << printMBBReference(*FBB) << ".\n" << " In the new BB: Insert B to " << printMBBReference(*TBB) << ".\n"); // Update the successor lists according to the transformation to follow. MBB->replaceSuccessor(TBB, NewBB); NewBB->addSuccessor(TBB); // Replace branch in the current (MBB) block. removeBranch(MBB); insertBranch(MBB, NewBB, FBB, Cond); updateOffsetAndLiveness(NewBB); return true; } bool BranchRelaxation::fixupUnconditionalBranch(MachineInstr &MI) { MachineBasicBlock *MBB = MI.getParent(); unsigned OldBrSize = TII->getInstSizeInBytes(MI); MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI); int64_t DestOffset = BlockInfo[DestBB->getNumber()].Offset; int64_t SrcOffset = getInstrOffset(MI); assert(!TII->isBranchOffsetInRange( MI.getOpcode(), MBB->getSectionID() != DestBB->getSectionID() ? TM->getMaxCodeSize() : DestOffset - SrcOffset)); BlockInfo[MBB->getNumber()].Size -= OldBrSize; MachineBasicBlock *BranchBB = MBB; // If this was an expanded conditional branch, there is already a single // unconditional branch in a block. if (!MBB->empty()) { BranchBB = createNewBlockAfter(*MBB); // Add live outs. for (const MachineBasicBlock *Succ : MBB->successors()) { for (const MachineBasicBlock::RegisterMaskPair &LiveIn : Succ->liveins()) BranchBB->addLiveIn(LiveIn); } BranchBB->sortUniqueLiveIns(); BranchBB->addSuccessor(DestBB); MBB->replaceSuccessor(DestBB, BranchBB); if (TrampolineInsertionPoint == MBB) TrampolineInsertionPoint = BranchBB; } DebugLoc DL = MI.getDebugLoc(); MI.eraseFromParent(); // Create the optional restore block and, initially, place it at the end of // function. That block will be placed later if it's used; otherwise, it will // be erased. MachineBasicBlock *RestoreBB = createNewBlockAfter(MF->back(), DestBB->getBasicBlock()); std::prev(RestoreBB->getIterator()) ->setIsEndSection(RestoreBB->isEndSection()); RestoreBB->setIsEndSection(false); TII->insertIndirectBranch(*BranchBB, *DestBB, *RestoreBB, DL, BranchBB->getSectionID() != DestBB->getSectionID() ? TM->getMaxCodeSize() : DestOffset - SrcOffset, RS.get()); // Update the block size and offset for the BranchBB (which may be newly // created). BlockInfo[BranchBB->getNumber()].Size = computeBlockSize(*BranchBB); adjustBlockOffsets(*MBB, std::next(BranchBB->getIterator())); // If RestoreBB is required, place it appropriately. if (!RestoreBB->empty()) { // If the jump is Cold -> Hot, don't place the restore block (which is // cold) in the middle of the function. Place it at the end. if (MBB->getSectionID() == MBBSectionID::ColdSectionID && DestBB->getSectionID() != MBBSectionID::ColdSectionID) { MachineBasicBlock *NewBB = createNewBlockAfter(*TrampolineInsertionPoint); TII->insertUnconditionalBranch(*NewBB, DestBB, DebugLoc()); BlockInfo[NewBB->getNumber()].Size = computeBlockSize(*NewBB); adjustBlockOffsets(*TrampolineInsertionPoint, std::next(NewBB->getIterator())); // New trampolines should be inserted after NewBB. TrampolineInsertionPoint = NewBB; // Retarget the unconditional branch to the trampoline block. BranchBB->replaceSuccessor(DestBB, NewBB); NewBB->addSuccessor(DestBB); DestBB = NewBB; } // In all other cases, try to place just before DestBB. // TODO: For multiple far branches to the same destination, there are // chances that some restore blocks could be shared if they clobber the // same registers and share the same restore sequence. So far, those // restore blocks are just duplicated for each far branch. assert(!DestBB->isEntryBlock()); MachineBasicBlock *PrevBB = &*std::prev(DestBB->getIterator()); // Fall through only if PrevBB has no unconditional branch as one of its // terminators. if (auto *FT = PrevBB->getLogicalFallThrough()) { assert(FT == DestBB); TII->insertUnconditionalBranch(*PrevBB, FT, DebugLoc()); BlockInfo[PrevBB->getNumber()].Size = computeBlockSize(*PrevBB); } // Now, RestoreBB could be placed directly before DestBB. MF->splice(DestBB->getIterator(), RestoreBB->getIterator()); // Update successors and predecessors. RestoreBB->addSuccessor(DestBB); BranchBB->replaceSuccessor(DestBB, RestoreBB); if (TRI->trackLivenessAfterRegAlloc(*MF)) computeAndAddLiveIns(LiveRegs, *RestoreBB); // Compute the restore block size. BlockInfo[RestoreBB->getNumber()].Size = computeBlockSize(*RestoreBB); // Update the estimated offset for the restore block. adjustBlockOffsets(*PrevBB, DestBB->getIterator()); // Fix up section information for RestoreBB and DestBB RestoreBB->setSectionID(DestBB->getSectionID()); RestoreBB->setIsBeginSection(DestBB->isBeginSection()); DestBB->setIsBeginSection(false); RelaxedUnconditionals.insert({BranchBB, RestoreBB}); } else { // Remove restore block if it's not required. MF->erase(RestoreBB); RelaxedUnconditionals.insert({BranchBB, DestBB}); } return true; } bool BranchRelaxation::relaxBranchInstructions() { bool Changed = false; // Relaxing branches involves creating new basic blocks, so re-eval // end() for termination. for (MachineBasicBlock &MBB : *MF) { // Empty block? MachineBasicBlock::iterator Last = MBB.getLastNonDebugInstr(); if (Last == MBB.end()) continue; // Expand the unconditional branch first if necessary. If there is a // conditional branch, this will end up changing the branch destination of // it to be over the newly inserted indirect branch block, which may avoid // the need to try expanding the conditional branch first, saving an extra // jump. if (Last->isUnconditionalBranch()) { // Unconditional branch destination might be unanalyzable, assume these // are OK. if (MachineBasicBlock *DestBB = TII->getBranchDestBlock(*Last)) { if (!isBlockInRange(*Last, *DestBB) && !TII->isTailCall(*Last) && !RelaxedUnconditionals.contains({&MBB, DestBB})) { fixupUnconditionalBranch(*Last); ++NumUnconditionalRelaxed; Changed = true; } } } // Loop over the conditional branches. MachineBasicBlock::iterator Next; for (MachineBasicBlock::iterator J = MBB.getFirstTerminator(); J != MBB.end(); J = Next) { Next = std::next(J); MachineInstr &MI = *J; if (!MI.isConditionalBranch()) continue; if (MI.getOpcode() == TargetOpcode::FAULTING_OP) // FAULTING_OP's destination is not encoded in the instruction stream // and thus never needs relaxed. continue; MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI); if (!isBlockInRange(MI, *DestBB)) { if (Next != MBB.end() && Next->isConditionalBranch()) { // If there are multiple conditional branches, this isn't an // analyzable block. Split later terminators into a new block so // each one will be analyzable. splitBlockBeforeInstr(*Next, DestBB); } else { fixupConditionalBranch(MI); ++NumConditionalRelaxed; } Changed = true; // This may have modified all of the terminators, so start over. Next = MBB.getFirstTerminator(); } } } // If we relaxed a branch, we must recompute offsets for *all* basic blocks. // Otherwise, we may underestimate branch distances and fail to relax a branch // that has been pushed out of range. if (Changed) adjustBlockOffsets(MF->front()); return Changed; } PreservedAnalyses BranchRelaxationPass::run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM) { if (!BranchRelaxation().run(MF)) return PreservedAnalyses::all(); return getMachineFunctionPassPreservedAnalyses(); } bool BranchRelaxation::run(MachineFunction &mf) { MF = &mf; LLVM_DEBUG(dbgs() << "***** BranchRelaxation *****\n"); const TargetSubtargetInfo &ST = MF->getSubtarget(); TII = ST.getInstrInfo(); TM = &MF->getTarget(); TRI = ST.getRegisterInfo(); if (TRI->trackLivenessAfterRegAlloc(*MF)) RS.reset(new RegScavenger()); // Renumber all of the machine basic blocks in the function, guaranteeing that // the numbers agree with the position of the block in the function. MF->RenumberBlocks(); // Do the initial scan of the function, building up information about the // sizes of each block. scanFunction(); LLVM_DEBUG(dbgs() << " Basic blocks before relaxation\n"; dumpBBs();); bool MadeChange = false; while (relaxBranchInstructions()) MadeChange = true; // After a while, this might be made debug-only, but it is not expensive. verify(); LLVM_DEBUG(dbgs() << " Basic blocks after relaxation\n\n"; dumpBBs()); BlockInfo.clear(); RelaxedUnconditionals.clear(); return MadeChange; }