307 lines
		
	
	
		
			9.8 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			307 lines
		
	
	
		
			9.8 KiB
		
	
	
	
		
			C++
		
	
	
	
//===-- SpeculateAnalyses.cpp  --*- C++ -*-===//
 | 
						|
//
 | 
						|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | 
						|
// See https://llvm.org/LICENSE.txt for license information.
 | 
						|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#include "llvm/ExecutionEngine/Orc/SpeculateAnalyses.h"
 | 
						|
#include "llvm/ADT/ArrayRef.h"
 | 
						|
#include "llvm/ADT/DenseMap.h"
 | 
						|
#include "llvm/ADT/STLExtras.h"
 | 
						|
#include "llvm/ADT/SmallPtrSet.h"
 | 
						|
#include "llvm/ADT/SmallVector.h"
 | 
						|
#include "llvm/Analysis/BlockFrequencyInfo.h"
 | 
						|
#include "llvm/Analysis/BranchProbabilityInfo.h"
 | 
						|
#include "llvm/Analysis/CFG.h"
 | 
						|
#include "llvm/IR/PassManager.h"
 | 
						|
#include "llvm/Passes/PassBuilder.h"
 | 
						|
#include "llvm/Support/ErrorHandling.h"
 | 
						|
 | 
						|
#include <algorithm>
 | 
						|
 | 
						|
namespace {
 | 
						|
using namespace llvm;
 | 
						|
SmallVector<const BasicBlock *, 8> findBBwithCalls(const Function &F,
 | 
						|
                                                   bool IndirectCall = false) {
 | 
						|
  SmallVector<const BasicBlock *, 8> BBs;
 | 
						|
 | 
						|
  auto findCallInst = [&IndirectCall](const Instruction &I) {
 | 
						|
    if (auto Call = dyn_cast<CallBase>(&I))
 | 
						|
      return Call->isIndirectCall() ? IndirectCall : true;
 | 
						|
    else
 | 
						|
      return false;
 | 
						|
  };
 | 
						|
  for (auto &BB : F)
 | 
						|
    if (findCallInst(*BB.getTerminator()) ||
 | 
						|
        llvm::any_of(BB.instructionsWithoutDebug(), findCallInst))
 | 
						|
      BBs.emplace_back(&BB);
 | 
						|
 | 
						|
  return BBs;
 | 
						|
}
 | 
						|
} // namespace
 | 
						|
 | 
						|
// Implementations of Queries shouldn't need to lock the resources
 | 
						|
// such as LLVMContext, each argument (function) has a non-shared LLVMContext
 | 
						|
// Plus, if Queries contain states necessary locking scheme should be provided.
 | 
						|
namespace llvm {
 | 
						|
namespace orc {
 | 
						|
 | 
						|
// Collect direct calls only
 | 
						|
void SpeculateQuery::findCalles(const BasicBlock *BB,
 | 
						|
                                DenseSet<StringRef> &CallesNames) {
 | 
						|
  assert(BB != nullptr && "Traversing Null BB to find calls?");
 | 
						|
 | 
						|
  auto getCalledFunction = [&CallesNames](const CallBase *Call) {
 | 
						|
    auto CalledValue = Call->getCalledOperand()->stripPointerCasts();
 | 
						|
    if (auto DirectCall = dyn_cast<Function>(CalledValue))
 | 
						|
      CallesNames.insert(DirectCall->getName());
 | 
						|
  };
 | 
						|
  for (auto &I : BB->instructionsWithoutDebug())
 | 
						|
    if (auto CI = dyn_cast<CallInst>(&I))
 | 
						|
      getCalledFunction(CI);
 | 
						|
 | 
						|
  if (auto II = dyn_cast<InvokeInst>(BB->getTerminator()))
 | 
						|
    getCalledFunction(II);
 | 
						|
}
 | 
						|
 | 
						|
bool SpeculateQuery::isStraightLine(const Function &F) {
 | 
						|
  return llvm::all_of(F.getBasicBlockList(), [](const BasicBlock &BB) {
 | 
						|
    return BB.getSingleSuccessor() != nullptr;
 | 
						|
  });
 | 
						|
}
 | 
						|
 | 
						|
// BlockFreqQuery Implementations
 | 
						|
 | 
						|
size_t BlockFreqQuery::numBBToGet(size_t numBB) {
 | 
						|
  // small CFG
 | 
						|
  if (numBB < 4)
 | 
						|
    return numBB;
 | 
						|
  // mid-size CFG
 | 
						|
  else if (numBB < 20)
 | 
						|
    return (numBB / 2);
 | 
						|
  else
 | 
						|
    return (numBB / 2) + (numBB / 4);
 | 
						|
}
 | 
						|
 | 
						|
BlockFreqQuery::ResultTy BlockFreqQuery::operator()(Function &F) {
 | 
						|
  DenseMap<StringRef, DenseSet<StringRef>> CallerAndCalles;
 | 
						|
  DenseSet<StringRef> Calles;
 | 
						|
  SmallVector<std::pair<const BasicBlock *, uint64_t>, 8> BBFreqs;
 | 
						|
 | 
						|
  PassBuilder PB;
 | 
						|
  FunctionAnalysisManager FAM;
 | 
						|
  PB.registerFunctionAnalyses(FAM);
 | 
						|
 | 
						|
  auto IBBs = findBBwithCalls(F);
 | 
						|
 | 
						|
  if (IBBs.empty())
 | 
						|
    return None;
 | 
						|
 | 
						|
  auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F);
 | 
						|
 | 
						|
  for (const auto I : IBBs)
 | 
						|
    BBFreqs.push_back({I, BFI.getBlockFreq(I).getFrequency()});
 | 
						|
 | 
						|
  assert(IBBs.size() == BBFreqs.size() && "BB Count Mismatch");
 | 
						|
 | 
						|
  llvm::sort(BBFreqs, [](decltype(BBFreqs)::const_reference BBF,
 | 
						|
                         decltype(BBFreqs)::const_reference BBS) {
 | 
						|
    return BBF.second > BBS.second ? true : false;
 | 
						|
  });
 | 
						|
 | 
						|
  // ignoring number of direct calls in a BB
 | 
						|
  auto Topk = numBBToGet(BBFreqs.size());
 | 
						|
 | 
						|
  for (size_t i = 0; i < Topk; i++)
 | 
						|
    findCalles(BBFreqs[i].first, Calles);
 | 
						|
 | 
						|
  assert(!Calles.empty() && "Running Analysis on Function with no calls?");
 | 
						|
 | 
						|
  CallerAndCalles.insert({F.getName(), std::move(Calles)});
 | 
						|
 | 
						|
  return CallerAndCalles;
 | 
						|
}
 | 
						|
 | 
						|
// SequenceBBQuery Implementation
 | 
						|
std::size_t SequenceBBQuery::getHottestBlocks(std::size_t TotalBlocks) {
 | 
						|
  if (TotalBlocks == 1)
 | 
						|
    return TotalBlocks;
 | 
						|
  return TotalBlocks / 2;
 | 
						|
}
 | 
						|
 | 
						|
// FIXME : find good implementation.
 | 
						|
SequenceBBQuery::BlockListTy
 | 
						|
SequenceBBQuery::rearrangeBB(const Function &F, const BlockListTy &BBList) {
 | 
						|
  BlockListTy RearrangedBBSet;
 | 
						|
 | 
						|
  for (auto &Block : F.getBasicBlockList())
 | 
						|
    if (llvm::is_contained(BBList, &Block))
 | 
						|
      RearrangedBBSet.push_back(&Block);
 | 
						|
 | 
						|
  assert(RearrangedBBSet.size() == BBList.size() &&
 | 
						|
         "BasicBlock missing while rearranging?");
 | 
						|
  return RearrangedBBSet;
 | 
						|
}
 | 
						|
 | 
						|
void SequenceBBQuery::traverseToEntryBlock(const BasicBlock *AtBB,
 | 
						|
                                           const BlockListTy &CallerBlocks,
 | 
						|
                                           const BackEdgesInfoTy &BackEdgesInfo,
 | 
						|
                                           const BranchProbabilityInfo *BPI,
 | 
						|
                                           VisitedBlocksInfoTy &VisitedBlocks) {
 | 
						|
  auto Itr = VisitedBlocks.find(AtBB);
 | 
						|
  if (Itr != VisitedBlocks.end()) { // already visited.
 | 
						|
    if (!Itr->second.Upward)
 | 
						|
      return;
 | 
						|
    Itr->second.Upward = false;
 | 
						|
  } else {
 | 
						|
    // Create hint for newly discoverd blocks.
 | 
						|
    WalkDirection BlockHint;
 | 
						|
    BlockHint.Upward = false;
 | 
						|
    // FIXME: Expensive Check
 | 
						|
    if (llvm::is_contained(CallerBlocks, AtBB))
 | 
						|
      BlockHint.CallerBlock = true;
 | 
						|
    VisitedBlocks.insert(std::make_pair(AtBB, BlockHint));
 | 
						|
  }
 | 
						|
 | 
						|
  const_pred_iterator PIt = pred_begin(AtBB), EIt = pred_end(AtBB);
 | 
						|
  // Move this check to top, when we have code setup to launch speculative
 | 
						|
  // compiles for function in entry BB, this triggers the speculative compiles
 | 
						|
  // before running the program.
 | 
						|
  if (PIt == EIt) // No Preds.
 | 
						|
    return;
 | 
						|
 | 
						|
  DenseSet<const BasicBlock *> PredSkipNodes;
 | 
						|
 | 
						|
  // Since we are checking for predecessor's backedges, this Block
 | 
						|
  // occurs in second position.
 | 
						|
  for (auto &I : BackEdgesInfo)
 | 
						|
    if (I.second == AtBB)
 | 
						|
      PredSkipNodes.insert(I.first);
 | 
						|
 | 
						|
  // Skip predecessors which source of back-edges.
 | 
						|
  for (; PIt != EIt; ++PIt)
 | 
						|
    // checking EdgeHotness is cheaper
 | 
						|
    if (BPI->isEdgeHot(*PIt, AtBB) && !PredSkipNodes.count(*PIt))
 | 
						|
      traverseToEntryBlock(*PIt, CallerBlocks, BackEdgesInfo, BPI,
 | 
						|
                           VisitedBlocks);
 | 
						|
}
 | 
						|
 | 
						|
void SequenceBBQuery::traverseToExitBlock(const BasicBlock *AtBB,
 | 
						|
                                          const BlockListTy &CallerBlocks,
 | 
						|
                                          const BackEdgesInfoTy &BackEdgesInfo,
 | 
						|
                                          const BranchProbabilityInfo *BPI,
 | 
						|
                                          VisitedBlocksInfoTy &VisitedBlocks) {
 | 
						|
  auto Itr = VisitedBlocks.find(AtBB);
 | 
						|
  if (Itr != VisitedBlocks.end()) { // already visited.
 | 
						|
    if (!Itr->second.Downward)
 | 
						|
      return;
 | 
						|
    Itr->second.Downward = false;
 | 
						|
  } else {
 | 
						|
    // Create hint for newly discoverd blocks.
 | 
						|
    WalkDirection BlockHint;
 | 
						|
    BlockHint.Downward = false;
 | 
						|
    // FIXME: Expensive Check
 | 
						|
    if (llvm::is_contained(CallerBlocks, AtBB))
 | 
						|
      BlockHint.CallerBlock = true;
 | 
						|
    VisitedBlocks.insert(std::make_pair(AtBB, BlockHint));
 | 
						|
  }
 | 
						|
 | 
						|
  const_succ_iterator PIt = succ_begin(AtBB), EIt = succ_end(AtBB);
 | 
						|
  if (PIt == EIt) // No succs.
 | 
						|
    return;
 | 
						|
 | 
						|
  // If there are hot edges, then compute SuccSkipNodes.
 | 
						|
  DenseSet<const BasicBlock *> SuccSkipNodes;
 | 
						|
 | 
						|
  // Since we are checking for successor's backedges, this Block
 | 
						|
  // occurs in first position.
 | 
						|
  for (auto &I : BackEdgesInfo)
 | 
						|
    if (I.first == AtBB)
 | 
						|
      SuccSkipNodes.insert(I.second);
 | 
						|
 | 
						|
  for (; PIt != EIt; ++PIt)
 | 
						|
    if (BPI->isEdgeHot(AtBB, *PIt) && !SuccSkipNodes.count(*PIt))
 | 
						|
      traverseToExitBlock(*PIt, CallerBlocks, BackEdgesInfo, BPI,
 | 
						|
                          VisitedBlocks);
 | 
						|
}
 | 
						|
 | 
						|
// Get Block frequencies for blocks and take most frquently executed block,
 | 
						|
// walk towards the entry block from those blocks and discover the basic blocks
 | 
						|
// with call.
 | 
						|
SequenceBBQuery::BlockListTy
 | 
						|
SequenceBBQuery::queryCFG(Function &F, const BlockListTy &CallerBlocks) {
 | 
						|
 | 
						|
  BlockFreqInfoTy BBFreqs;
 | 
						|
  VisitedBlocksInfoTy VisitedBlocks;
 | 
						|
  BackEdgesInfoTy BackEdgesInfo;
 | 
						|
 | 
						|
  PassBuilder PB;
 | 
						|
  FunctionAnalysisManager FAM;
 | 
						|
  PB.registerFunctionAnalyses(FAM);
 | 
						|
 | 
						|
  auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F);
 | 
						|
 | 
						|
  llvm::FindFunctionBackedges(F, BackEdgesInfo);
 | 
						|
 | 
						|
  for (const auto I : CallerBlocks)
 | 
						|
    BBFreqs.push_back({I, BFI.getBlockFreq(I).getFrequency()});
 | 
						|
 | 
						|
  llvm::sort(BBFreqs, [](decltype(BBFreqs)::const_reference Bbf,
 | 
						|
                         decltype(BBFreqs)::const_reference Bbs) {
 | 
						|
    return Bbf.second > Bbs.second;
 | 
						|
  });
 | 
						|
 | 
						|
  ArrayRef<std::pair<const BasicBlock *, uint64_t>> HotBlocksRef(BBFreqs);
 | 
						|
  HotBlocksRef =
 | 
						|
      HotBlocksRef.drop_back(BBFreqs.size() - getHottestBlocks(BBFreqs.size()));
 | 
						|
 | 
						|
  BranchProbabilityInfo *BPI =
 | 
						|
      FAM.getCachedResult<BranchProbabilityAnalysis>(F);
 | 
						|
 | 
						|
  // visit NHotBlocks,
 | 
						|
  // traverse upwards to entry
 | 
						|
  // traverse downwards to end.
 | 
						|
 | 
						|
  for (auto I : HotBlocksRef) {
 | 
						|
    traverseToEntryBlock(I.first, CallerBlocks, BackEdgesInfo, BPI,
 | 
						|
                         VisitedBlocks);
 | 
						|
    traverseToExitBlock(I.first, CallerBlocks, BackEdgesInfo, BPI,
 | 
						|
                        VisitedBlocks);
 | 
						|
  }
 | 
						|
 | 
						|
  BlockListTy MinCallerBlocks;
 | 
						|
  for (auto &I : VisitedBlocks)
 | 
						|
    if (I.second.CallerBlock)
 | 
						|
      MinCallerBlocks.push_back(std::move(I.first));
 | 
						|
 | 
						|
  return rearrangeBB(F, MinCallerBlocks);
 | 
						|
}
 | 
						|
 | 
						|
SpeculateQuery::ResultTy SequenceBBQuery::operator()(Function &F) {
 | 
						|
  // reduce the number of lists!
 | 
						|
  DenseMap<StringRef, DenseSet<StringRef>> CallerAndCalles;
 | 
						|
  DenseSet<StringRef> Calles;
 | 
						|
  BlockListTy SequencedBlocks;
 | 
						|
  BlockListTy CallerBlocks;
 | 
						|
 | 
						|
  CallerBlocks = findBBwithCalls(F);
 | 
						|
  if (CallerBlocks.empty())
 | 
						|
    return None;
 | 
						|
 | 
						|
  if (isStraightLine(F))
 | 
						|
    SequencedBlocks = rearrangeBB(F, CallerBlocks);
 | 
						|
  else
 | 
						|
    SequencedBlocks = queryCFG(F, CallerBlocks);
 | 
						|
 | 
						|
  for (auto BB : SequencedBlocks)
 | 
						|
    findCalles(BB, Calles);
 | 
						|
 | 
						|
  CallerAndCalles.insert({F.getName(), std::move(Calles)});
 | 
						|
  return CallerAndCalles;
 | 
						|
}
 | 
						|
 | 
						|
} // namespace orc
 | 
						|
} // namespace llvm
 |