|  | //===- BlockExtractor.cpp - Extracts blocks into their own functions ------===// | 
|  | // | 
|  | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|  | // See https://llvm.org/LICENSE.txt for license information. | 
|  | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | // | 
|  | // This pass extracts the specified basic blocks from the module into their | 
|  | // own functions. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  |  | 
|  | #include "llvm/Transforms/IPO/BlockExtractor.h" | 
|  | #include "llvm/ADT/STLExtras.h" | 
|  | #include "llvm/ADT/Statistic.h" | 
|  | #include "llvm/IR/Instructions.h" | 
|  | #include "llvm/IR/Module.h" | 
|  | #include "llvm/IR/PassManager.h" | 
|  | #include "llvm/Support/CommandLine.h" | 
|  | #include "llvm/Support/Debug.h" | 
|  | #include "llvm/Support/MemoryBuffer.h" | 
|  | #include "llvm/Transforms/IPO.h" | 
|  | #include "llvm/Transforms/Utils/BasicBlockUtils.h" | 
|  | #include "llvm/Transforms/Utils/CodeExtractor.h" | 
|  |  | 
|  | using namespace llvm; | 
|  |  | 
|  | #define DEBUG_TYPE "block-extractor" | 
|  |  | 
|  | STATISTIC(NumExtracted, "Number of basic blocks extracted"); | 
|  |  | 
|  | static cl::opt<std::string> BlockExtractorFile( | 
|  | "extract-blocks-file", cl::value_desc("filename"), | 
|  | cl::desc("A file containing list of basic blocks to extract"), cl::Hidden); | 
|  |  | 
|  | static cl::opt<bool> | 
|  | BlockExtractorEraseFuncs("extract-blocks-erase-funcs", | 
|  | cl::desc("Erase the existing functions"), | 
|  | cl::Hidden); | 
|  | namespace { | 
|  | class BlockExtractor { | 
|  | public: | 
|  | BlockExtractor(bool EraseFunctions) : EraseFunctions(EraseFunctions) {} | 
|  | bool runOnModule(Module &M); | 
|  | void | 
|  | init(const std::vector<std::vector<BasicBlock *>> &GroupsOfBlocksToExtract) { | 
|  | GroupsOfBlocks = GroupsOfBlocksToExtract; | 
|  | if (!BlockExtractorFile.empty()) | 
|  | loadFile(); | 
|  | } | 
|  |  | 
|  | private: | 
|  | std::vector<std::vector<BasicBlock *>> GroupsOfBlocks; | 
|  | bool EraseFunctions; | 
|  | /// Map a function name to groups of blocks. | 
|  | SmallVector<std::pair<std::string, SmallVector<std::string, 4>>, 4> | 
|  | BlocksByName; | 
|  |  | 
|  | void loadFile(); | 
|  | void splitLandingPadPreds(Function &F); | 
|  | }; | 
|  |  | 
|  | } // end anonymous namespace | 
|  |  | 
|  | /// Gets all of the blocks specified in the input file. | 
|  | void BlockExtractor::loadFile() { | 
|  | auto ErrOrBuf = MemoryBuffer::getFile(BlockExtractorFile); | 
|  | if (ErrOrBuf.getError()) | 
|  | report_fatal_error("BlockExtractor couldn't load the file."); | 
|  | // Read the file. | 
|  | auto &Buf = *ErrOrBuf; | 
|  | SmallVector<StringRef, 16> Lines; | 
|  | Buf->getBuffer().split(Lines, '\n', /*MaxSplit=*/-1, | 
|  | /*KeepEmpty=*/false); | 
|  | for (const auto &Line : Lines) { | 
|  | SmallVector<StringRef, 4> LineSplit; | 
|  | Line.split(LineSplit, ' ', /*MaxSplit=*/-1, | 
|  | /*KeepEmpty=*/false); | 
|  | if (LineSplit.empty()) | 
|  | continue; | 
|  | if (LineSplit.size()!=2) | 
|  | reportFatalUsageError( | 
|  | "Invalid line format, expecting lines like: 'funcname bb1[;bb2..]'"); | 
|  | SmallVector<StringRef, 4> BBNames; | 
|  | LineSplit[1].split(BBNames, ';', /*MaxSplit=*/-1, | 
|  | /*KeepEmpty=*/false); | 
|  | if (BBNames.empty()) | 
|  | report_fatal_error("Missing bbs name"); | 
|  | BlocksByName.push_back( | 
|  | {std::string(LineSplit[0]), {BBNames.begin(), BBNames.end()}}); | 
|  | } | 
|  | } | 
|  |  | 
|  | /// Extracts the landing pads to make sure all of them have only one | 
|  | /// predecessor. | 
|  | void BlockExtractor::splitLandingPadPreds(Function &F) { | 
|  | for (BasicBlock &BB : F) { | 
|  | for (Instruction &I : BB) { | 
|  | if (!isa<InvokeInst>(&I)) | 
|  | continue; | 
|  | InvokeInst *II = cast<InvokeInst>(&I); | 
|  | BasicBlock *Parent = II->getParent(); | 
|  | BasicBlock *LPad = II->getUnwindDest(); | 
|  |  | 
|  | // Look through the landing pad's predecessors. If one of them ends in an | 
|  | // 'invoke', then we want to split the landing pad. | 
|  | bool Split = false; | 
|  | for (auto *PredBB : predecessors(LPad)) { | 
|  | if (PredBB->isLandingPad() && PredBB != Parent && | 
|  | isa<InvokeInst>(Parent->getTerminator())) { | 
|  | Split = true; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (!Split) | 
|  | continue; | 
|  |  | 
|  | SmallVector<BasicBlock *, 2> NewBBs; | 
|  | SplitLandingPadPredecessors(LPad, Parent, ".1", ".2", NewBBs); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | bool BlockExtractor::runOnModule(Module &M) { | 
|  | bool Changed = false; | 
|  |  | 
|  | // Get all the functions. | 
|  | SmallVector<Function *, 4> Functions; | 
|  | for (Function &F : M) { | 
|  | splitLandingPadPreds(F); | 
|  | Functions.push_back(&F); | 
|  | } | 
|  |  | 
|  | // Get all the blocks specified in the input file. | 
|  | unsigned NextGroupIdx = GroupsOfBlocks.size(); | 
|  | GroupsOfBlocks.resize(NextGroupIdx + BlocksByName.size()); | 
|  | for (const auto &BInfo : BlocksByName) { | 
|  | Function *F = M.getFunction(BInfo.first); | 
|  | if (!F) | 
|  | reportFatalUsageError( | 
|  | "Invalid function name specified in the input file"); | 
|  | for (const auto &BBInfo : BInfo.second) { | 
|  | auto Res = llvm::find_if( | 
|  | *F, [&](const BasicBlock &BB) { return BB.getName() == BBInfo; }); | 
|  | if (Res == F->end()) | 
|  | reportFatalUsageError("Invalid block name specified in the input file"); | 
|  | GroupsOfBlocks[NextGroupIdx].push_back(&*Res); | 
|  | } | 
|  | ++NextGroupIdx; | 
|  | } | 
|  |  | 
|  | // Extract each group of basic blocks. | 
|  | for (auto &BBs : GroupsOfBlocks) { | 
|  | SmallVector<BasicBlock *, 32> BlocksToExtractVec; | 
|  | for (BasicBlock *BB : BBs) { | 
|  | // Check if the module contains BB. | 
|  | if (BB->getParent()->getParent() != &M) | 
|  | reportFatalUsageError("Invalid basic block"); | 
|  | LLVM_DEBUG(dbgs() << "BlockExtractor: Extracting " | 
|  | << BB->getParent()->getName() << ":" << BB->getName() | 
|  | << "\n"); | 
|  | BlocksToExtractVec.push_back(BB); | 
|  | if (const InvokeInst *II = dyn_cast<InvokeInst>(BB->getTerminator())) | 
|  | BlocksToExtractVec.push_back(II->getUnwindDest()); | 
|  | ++NumExtracted; | 
|  | Changed = true; | 
|  | } | 
|  | CodeExtractorAnalysisCache CEAC(*BBs[0]->getParent()); | 
|  | Function *F = CodeExtractor(BlocksToExtractVec).extractCodeRegion(CEAC); | 
|  | if (F) | 
|  | LLVM_DEBUG(dbgs() << "Extracted group '" << (*BBs.begin())->getName() | 
|  | << "' in: " << F->getName() << '\n'); | 
|  | else | 
|  | LLVM_DEBUG(dbgs() << "Failed to extract for group '" | 
|  | << (*BBs.begin())->getName() << "'\n"); | 
|  | } | 
|  |  | 
|  | // Erase the functions. | 
|  | if (EraseFunctions || BlockExtractorEraseFuncs) { | 
|  | for (Function *F : Functions) { | 
|  | LLVM_DEBUG(dbgs() << "BlockExtractor: Trying to delete " << F->getName() | 
|  | << "\n"); | 
|  | F->deleteBody(); | 
|  | } | 
|  | // Set linkage as ExternalLinkage to avoid erasing unreachable functions. | 
|  | for (Function &F : M) | 
|  | F.setLinkage(GlobalValue::ExternalLinkage); | 
|  | Changed = true; | 
|  | } | 
|  |  | 
|  | return Changed; | 
|  | } | 
|  |  | 
|  | BlockExtractorPass::BlockExtractorPass( | 
|  | std::vector<std::vector<BasicBlock *>> &&GroupsOfBlocks, | 
|  | bool EraseFunctions) | 
|  | : GroupsOfBlocks(GroupsOfBlocks), EraseFunctions(EraseFunctions) {} | 
|  |  | 
|  | PreservedAnalyses BlockExtractorPass::run(Module &M, | 
|  | ModuleAnalysisManager &AM) { | 
|  | BlockExtractor BE(EraseFunctions); | 
|  | BE.init(GroupsOfBlocks); | 
|  | return BE.runOnModule(M) ? PreservedAnalyses::none() | 
|  | : PreservedAnalyses::all(); | 
|  | } |