252 lines
		
	
	
		
			9.7 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			252 lines
		
	
	
		
			9.7 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===- FunctionPropertiesAnalysis.cpp - Function Properties Analysis ------===//
 | |
| //
 | |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | |
| // See https://llvm.org/LICENSE.txt for license information.
 | |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| //
 | |
| // This file defines the FunctionPropertiesInfo and FunctionPropertiesAnalysis
 | |
| // classes used to extract function properties.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "llvm/Analysis/FunctionPropertiesAnalysis.h"
 | |
| #include "llvm/ADT/STLExtras.h"
 | |
| #include "llvm/ADT/SetVector.h"
 | |
| #include "llvm/Analysis/LoopInfo.h"
 | |
| #include "llvm/IR/CFG.h"
 | |
| #include "llvm/IR/Dominators.h"
 | |
| #include "llvm/IR/Instructions.h"
 | |
| #include <deque>
 | |
| 
 | |
| using namespace llvm;
 | |
| 
 | |
| namespace {
 | |
| int64_t getNrBlocksFromCond(const BasicBlock &BB) {
 | |
|   int64_t Ret = 0;
 | |
|   if (const auto *BI = dyn_cast<BranchInst>(BB.getTerminator())) {
 | |
|     if (BI->isConditional())
 | |
|       Ret += BI->getNumSuccessors();
 | |
|   } else if (const auto *SI = dyn_cast<SwitchInst>(BB.getTerminator())) {
 | |
|     Ret += (SI->getNumCases() + (nullptr != SI->getDefaultDest()));
 | |
|   }
 | |
|   return Ret;
 | |
| }
 | |
| 
 | |
| int64_t getUses(const Function &F) {
 | |
|   return ((!F.hasLocalLinkage()) ? 1 : 0) + F.getNumUses();
 | |
| }
 | |
| } // namespace
 | |
| 
 | |
| void FunctionPropertiesInfo::reIncludeBB(const BasicBlock &BB) {
 | |
|   updateForBB(BB, +1);
 | |
| }
 | |
| 
 | |
| void FunctionPropertiesInfo::updateForBB(const BasicBlock &BB,
 | |
|                                          int64_t Direction) {
 | |
|   assert(Direction == 1 || Direction == -1);
 | |
|   BasicBlockCount += Direction;
 | |
|   BlocksReachedFromConditionalInstruction +=
 | |
|       (Direction * getNrBlocksFromCond(BB));
 | |
|   for (const auto &I : BB) {
 | |
|     if (auto *CS = dyn_cast<CallBase>(&I)) {
 | |
|       const auto *Callee = CS->getCalledFunction();
 | |
|       if (Callee && !Callee->isIntrinsic() && !Callee->isDeclaration())
 | |
|         DirectCallsToDefinedFunctions += Direction;
 | |
|     }
 | |
|     if (I.getOpcode() == Instruction::Load) {
 | |
|       LoadInstCount += Direction;
 | |
|     } else if (I.getOpcode() == Instruction::Store) {
 | |
|       StoreInstCount += Direction;
 | |
|     }
 | |
|   }
 | |
|   TotalInstructionCount += Direction * BB.sizeWithoutDebug();
 | |
| }
 | |
| 
 | |
| void FunctionPropertiesInfo::updateAggregateStats(const Function &F,
 | |
|                                                   const LoopInfo &LI) {
 | |
| 
 | |
|   Uses = getUses(F);
 | |
|   TopLevelLoopCount = llvm::size(LI);
 | |
|   MaxLoopDepth = 0;
 | |
|   std::deque<const Loop *> Worklist;
 | |
|   llvm::append_range(Worklist, LI);
 | |
|   while (!Worklist.empty()) {
 | |
|     const auto *L = Worklist.front();
 | |
|     MaxLoopDepth =
 | |
|         std::max(MaxLoopDepth, static_cast<int64_t>(L->getLoopDepth()));
 | |
|     Worklist.pop_front();
 | |
|     llvm::append_range(Worklist, L->getSubLoops());
 | |
|   }
 | |
| }
 | |
| 
 | |
| FunctionPropertiesInfo FunctionPropertiesInfo::getFunctionPropertiesInfo(
 | |
|     const Function &F, FunctionAnalysisManager &FAM) {
 | |
| 
 | |
|   FunctionPropertiesInfo FPI;
 | |
|   // The const casts are due to the getResult API - there's no mutation of F.
 | |
|   const auto &LI = FAM.getResult<LoopAnalysis>(const_cast<Function &>(F));
 | |
|   const auto &DT =
 | |
|       FAM.getResult<DominatorTreeAnalysis>(const_cast<Function &>(F));
 | |
|   for (const auto &BB : F)
 | |
|     if (DT.isReachableFromEntry(&BB))
 | |
|       FPI.reIncludeBB(BB);
 | |
|   FPI.updateAggregateStats(F, LI);
 | |
|   return FPI;
 | |
| }
 | |
| 
 | |
| void FunctionPropertiesInfo::print(raw_ostream &OS) const {
 | |
|   OS << "BasicBlockCount: " << BasicBlockCount << "\n"
 | |
|      << "BlocksReachedFromConditionalInstruction: "
 | |
|      << BlocksReachedFromConditionalInstruction << "\n"
 | |
|      << "Uses: " << Uses << "\n"
 | |
|      << "DirectCallsToDefinedFunctions: " << DirectCallsToDefinedFunctions
 | |
|      << "\n"
 | |
|      << "LoadInstCount: " << LoadInstCount << "\n"
 | |
|      << "StoreInstCount: " << StoreInstCount << "\n"
 | |
|      << "MaxLoopDepth: " << MaxLoopDepth << "\n"
 | |
|      << "TopLevelLoopCount: " << TopLevelLoopCount << "\n"
 | |
|      << "TotalInstructionCount: " << TotalInstructionCount << "\n\n";
 | |
| }
 | |
| 
 | |
| AnalysisKey FunctionPropertiesAnalysis::Key;
 | |
| 
 | |
| FunctionPropertiesInfo
 | |
| FunctionPropertiesAnalysis::run(Function &F, FunctionAnalysisManager &FAM) {
 | |
|   return FunctionPropertiesInfo::getFunctionPropertiesInfo(F, FAM);
 | |
| }
 | |
| 
 | |
| PreservedAnalyses
 | |
| FunctionPropertiesPrinterPass::run(Function &F, FunctionAnalysisManager &AM) {
 | |
|   OS << "Printing analysis results of CFA for function "
 | |
|      << "'" << F.getName() << "':"
 | |
|      << "\n";
 | |
|   AM.getResult<FunctionPropertiesAnalysis>(F).print(OS);
 | |
|   return PreservedAnalyses::all();
 | |
| }
 | |
| 
 | |
| FunctionPropertiesUpdater::FunctionPropertiesUpdater(
 | |
|     FunctionPropertiesInfo &FPI, const CallBase &CB)
 | |
|     : FPI(FPI), CallSiteBB(*CB.getParent()), Caller(*CallSiteBB.getParent()) {
 | |
|   assert(isa<CallInst>(CB) || isa<InvokeInst>(CB));
 | |
|   // For BBs that are likely to change, we subtract from feature totals their
 | |
|   // contribution. Some features, like max loop counts or depths, are left
 | |
|   // invalid, as they will be updated post-inlining.
 | |
|   SmallPtrSet<const BasicBlock *, 4> LikelyToChangeBBs;
 | |
|   // The CB BB will change - it'll either be split or the callee's body (single
 | |
|   // BB) will be pasted in.
 | |
|   LikelyToChangeBBs.insert(&CallSiteBB);
 | |
| 
 | |
|   // The caller's entry BB may change due to new alloca instructions.
 | |
|   LikelyToChangeBBs.insert(&*Caller.begin());
 | |
| 
 | |
|   // The successors may become unreachable in the case of `invoke` inlining.
 | |
|   // We track successors separately, too, because they form a boundary, together
 | |
|   // with the CB BB ('Entry') between which the inlined callee will be pasted.
 | |
|   Successors.insert(succ_begin(&CallSiteBB), succ_end(&CallSiteBB));
 | |
| 
 | |
|   // Inlining only handles invoke and calls. If this is an invoke, and inlining
 | |
|   // it pulls another invoke, the original landing pad may get split, so as to
 | |
|   // share its content with other potential users. So the edge up to which we
 | |
|   // need to invalidate and then re-account BB data is the successors of the
 | |
|   // current landing pad. We can leave the current lp, too - if it doesn't get
 | |
|   // split, then it will be the place traversal stops. Either way, the
 | |
|   // discounted BBs will be checked if reachable and re-added.
 | |
|   if (const auto *II = dyn_cast<InvokeInst>(&CB)) {
 | |
|     const auto *UnwindDest = II->getUnwindDest();
 | |
|     Successors.insert(succ_begin(UnwindDest), succ_end(UnwindDest));
 | |
|   }
 | |
| 
 | |
|   // Exclude the CallSiteBB, if it happens to be its own successor (1-BB loop).
 | |
|   // We are only interested in BBs the graph moves past the callsite BB to
 | |
|   // define the frontier past which we don't want to re-process BBs. Including
 | |
|   // the callsite BB in this case would prematurely stop the traversal in
 | |
|   // finish().
 | |
|   Successors.erase(&CallSiteBB);
 | |
| 
 | |
|   for (const auto *BB : Successors)
 | |
|     LikelyToChangeBBs.insert(BB);
 | |
| 
 | |
|   // Commit the change. While some of the BBs accounted for above may play dual
 | |
|   // role - e.g. caller's entry BB may be the same as the callsite BB - set
 | |
|   // insertion semantics make sure we account them once. This needs to be
 | |
|   // followed in `finish`, too.
 | |
|   for (const auto *BB : LikelyToChangeBBs)
 | |
|     FPI.updateForBB(*BB, -1);
 | |
| }
 | |
| 
 | |
| void FunctionPropertiesUpdater::finish(FunctionAnalysisManager &FAM) const {
 | |
|   // Update feature values from the BBs that were copied from the callee, or
 | |
|   // might have been modified because of inlining. The latter have been
 | |
|   // subtracted in the FunctionPropertiesUpdater ctor.
 | |
|   // There could be successors that were reached before but now are only
 | |
|   // reachable from elsewhere in the CFG.
 | |
|   // One example is the following diamond CFG (lines are arrows pointing down):
 | |
|   //    A
 | |
|   //  /   \
 | |
|   // B     C
 | |
|   // |     |
 | |
|   // |     D
 | |
|   // |     |
 | |
|   // |     E
 | |
|   //  \   /
 | |
|   //    F
 | |
|   // There's a call site in C that is inlined. Upon doing that, it turns out
 | |
|   // it expands to
 | |
|   //   call void @llvm.trap()
 | |
|   //   unreachable
 | |
|   // F isn't reachable from C anymore, but we did discount it when we set up
 | |
|   // FunctionPropertiesUpdater, so we need to re-include it here.
 | |
|   // At the same time, D and E were reachable before, but now are not anymore,
 | |
|   // so we need to leave D out (we discounted it at setup), and explicitly
 | |
|   // remove E.
 | |
|   SetVector<const BasicBlock *> Reinclude;
 | |
|   SetVector<const BasicBlock *> Unreachable;
 | |
|   const auto &DT =
 | |
|       FAM.getResult<DominatorTreeAnalysis>(const_cast<Function &>(Caller));
 | |
| 
 | |
|   if (&CallSiteBB != &*Caller.begin())
 | |
|     Reinclude.insert(&*Caller.begin());
 | |
| 
 | |
|   // Distribute the successors to the 2 buckets.
 | |
|   for (const auto *Succ : Successors)
 | |
|     if (DT.isReachableFromEntry(Succ))
 | |
|       Reinclude.insert(Succ);
 | |
|     else
 | |
|       Unreachable.insert(Succ);
 | |
| 
 | |
|   // For reinclusion, we want to stop at the reachable successors, who are at
 | |
|   // the beginning of the worklist; but, starting from the callsite bb and
 | |
|   // ending at those successors, we also want to perform a traversal.
 | |
|   // IncludeSuccessorsMark is the index after which we include successors.
 | |
|   const auto IncludeSuccessorsMark = Reinclude.size();
 | |
|   bool CSInsertion = Reinclude.insert(&CallSiteBB);
 | |
|   (void)CSInsertion;
 | |
|   assert(CSInsertion);
 | |
|   for (size_t I = 0; I < Reinclude.size(); ++I) {
 | |
|     const auto *BB = Reinclude[I];
 | |
|     FPI.reIncludeBB(*BB);
 | |
|     if (I >= IncludeSuccessorsMark)
 | |
|       Reinclude.insert(succ_begin(BB), succ_end(BB));
 | |
|   }
 | |
| 
 | |
|   // For exclusion, we don't need to exclude the set of BBs that were successors
 | |
|   // before and are now unreachable, because we already did that at setup. For
 | |
|   // the rest, as long as a successor is unreachable, we want to explicitly
 | |
|   // exclude it.
 | |
|   const auto AlreadyExcludedMark = Unreachable.size();
 | |
|   for (size_t I = 0; I < Unreachable.size(); ++I) {
 | |
|     const auto *U = Unreachable[I];
 | |
|     if (I >= AlreadyExcludedMark)
 | |
|       FPI.updateForBB(*U, -1);
 | |
|     for (const auto *Succ : successors(U))
 | |
|       if (!DT.isReachableFromEntry(Succ))
 | |
|         Unreachable.insert(Succ);
 | |
|   }
 | |
| 
 | |
|   const auto &LI = FAM.getResult<LoopAnalysis>(const_cast<Function &>(Caller));
 | |
|   FPI.updateAggregateStats(Caller, LI);
 | |
|   assert(FPI == FunctionPropertiesInfo::getFunctionPropertiesInfo(Caller, FAM));
 | |
| }
 |