217 lines
		
	
	
		
			7.4 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			217 lines
		
	
	
		
			7.4 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===-- RegUsageInfoCollector.cpp - Register Usage Information Collector --===//
 | |
| //
 | |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | |
| // See https://llvm.org/LICENSE.txt for license information.
 | |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| ///
 | |
| /// This pass is required to take advantage of the interprocedural register
 | |
| /// allocation infrastructure.
 | |
| ///
 | |
| /// This pass is simple MachineFunction pass which collects register usage
 | |
| /// details by iterating through each physical registers and checking
 | |
| /// MRI::isPhysRegUsed() then creates a RegMask based on this details.
 | |
| /// The pass then stores this RegMask in PhysicalRegisterUsageInfo.cpp
 | |
| ///
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "llvm/ADT/Statistic.h"
 | |
| #include "llvm/CodeGen/MachineBasicBlock.h"
 | |
| #include "llvm/CodeGen/MachineFunctionPass.h"
 | |
| #include "llvm/CodeGen/MachineInstr.h"
 | |
| #include "llvm/CodeGen/MachineOperand.h"
 | |
| #include "llvm/CodeGen/MachineRegisterInfo.h"
 | |
| #include "llvm/CodeGen/Passes.h"
 | |
| #include "llvm/CodeGen/RegisterUsageInfo.h"
 | |
| #include "llvm/Support/Debug.h"
 | |
| #include "llvm/Support/raw_ostream.h"
 | |
| #include "llvm/CodeGen/TargetFrameLowering.h"
 | |
| 
 | |
| using namespace llvm;
 | |
| 
 | |
| #define DEBUG_TYPE "ip-regalloc"
 | |
| 
 | |
| STATISTIC(NumCSROpt,
 | |
|           "Number of functions optimized for callee saved registers");
 | |
| 
 | |
| namespace {
 | |
| 
 | |
| class RegUsageInfoCollector : public MachineFunctionPass {
 | |
| public:
 | |
|   RegUsageInfoCollector() : MachineFunctionPass(ID) {
 | |
|     PassRegistry &Registry = *PassRegistry::getPassRegistry();
 | |
|     initializeRegUsageInfoCollectorPass(Registry);
 | |
|   }
 | |
| 
 | |
|   StringRef getPassName() const override {
 | |
|     return "Register Usage Information Collector Pass";
 | |
|   }
 | |
| 
 | |
|   void getAnalysisUsage(AnalysisUsage &AU) const override {
 | |
|     AU.addRequired<PhysicalRegisterUsageInfo>();
 | |
|     AU.setPreservesAll();
 | |
|     MachineFunctionPass::getAnalysisUsage(AU);
 | |
|   }
 | |
| 
 | |
|   bool runOnMachineFunction(MachineFunction &MF) override;
 | |
| 
 | |
|   // Call getCalleeSaves and then also set the bits for subregs and
 | |
|   // fully saved superregs.
 | |
|   static void computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF);
 | |
| 
 | |
|   static char ID;
 | |
| };
 | |
| 
 | |
| } // end of anonymous namespace
 | |
| 
 | |
| char RegUsageInfoCollector::ID = 0;
 | |
| 
 | |
| INITIALIZE_PASS_BEGIN(RegUsageInfoCollector, "RegUsageInfoCollector",
 | |
|                       "Register Usage Information Collector", false, false)
 | |
| INITIALIZE_PASS_DEPENDENCY(PhysicalRegisterUsageInfo)
 | |
| INITIALIZE_PASS_END(RegUsageInfoCollector, "RegUsageInfoCollector",
 | |
|                     "Register Usage Information Collector", false, false)
 | |
| 
 | |
| FunctionPass *llvm::createRegUsageInfoCollector() {
 | |
|   return new RegUsageInfoCollector();
 | |
| }
 | |
| 
 | |
| // TODO: Move to hook somwehere?
 | |
| 
 | |
| // Return true if it is useful to track the used registers for IPRA / no CSR
 | |
| // optimizations. This is not useful for entry points, and computing the
 | |
| // register usage information is expensive.
 | |
| static bool isCallableFunction(const MachineFunction &MF) {
 | |
|   switch (MF.getFunction().getCallingConv()) {
 | |
|   case CallingConv::AMDGPU_VS:
 | |
|   case CallingConv::AMDGPU_GS:
 | |
|   case CallingConv::AMDGPU_PS:
 | |
|   case CallingConv::AMDGPU_CS:
 | |
|   case CallingConv::AMDGPU_HS:
 | |
|   case CallingConv::AMDGPU_ES:
 | |
|   case CallingConv::AMDGPU_LS:
 | |
|   case CallingConv::AMDGPU_KERNEL:
 | |
|     return false;
 | |
|   default:
 | |
|     return true;
 | |
|   }
 | |
| }
 | |
| 
 | |
| bool RegUsageInfoCollector::runOnMachineFunction(MachineFunction &MF) {
 | |
|   MachineRegisterInfo *MRI = &MF.getRegInfo();
 | |
|   const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
 | |
|   const LLVMTargetMachine &TM = MF.getTarget();
 | |
| 
 | |
|   LLVM_DEBUG(dbgs() << " -------------------- " << getPassName()
 | |
|                     << " -------------------- \nFunction Name : "
 | |
|                     << MF.getName() << '\n');
 | |
| 
 | |
|   // Analyzing the register usage may be expensive on some targets.
 | |
|   if (!isCallableFunction(MF)) {
 | |
|     LLVM_DEBUG(dbgs() << "Not analyzing non-callable function\n");
 | |
|     return false;
 | |
|   }
 | |
| 
 | |
|   // If there are no callers, there's no point in computing more precise
 | |
|   // register usage here.
 | |
|   if (MF.getFunction().use_empty()) {
 | |
|     LLVM_DEBUG(dbgs() << "Not analyzing function with no callers\n");
 | |
|     return false;
 | |
|   }
 | |
| 
 | |
|   std::vector<uint32_t> RegMask;
 | |
| 
 | |
|   // Compute the size of the bit vector to represent all the registers.
 | |
|   // The bit vector is broken into 32-bit chunks, thus takes the ceil of
 | |
|   // the number of registers divided by 32 for the size.
 | |
|   unsigned RegMaskSize = MachineOperand::getRegMaskSize(TRI->getNumRegs());
 | |
|   RegMask.resize(RegMaskSize, ~((uint32_t)0));
 | |
| 
 | |
|   const Function &F = MF.getFunction();
 | |
| 
 | |
|   PhysicalRegisterUsageInfo &PRUI = getAnalysis<PhysicalRegisterUsageInfo>();
 | |
|   PRUI.setTargetMachine(TM);
 | |
| 
 | |
|   LLVM_DEBUG(dbgs() << "Clobbered Registers: ");
 | |
| 
 | |
|   BitVector SavedRegs;
 | |
|   computeCalleeSavedRegs(SavedRegs, MF);
 | |
| 
 | |
|   const BitVector &UsedPhysRegsMask = MRI->getUsedPhysRegsMask();
 | |
|   auto SetRegAsDefined = [&RegMask] (unsigned Reg) {
 | |
|     RegMask[Reg / 32] &= ~(1u << Reg % 32);
 | |
|   };
 | |
| 
 | |
|   // Some targets can clobber registers "inside" a call, typically in
 | |
|   // linker-generated code.
 | |
|   for (const MCPhysReg Reg : TRI->getIntraCallClobberedRegs(&MF))
 | |
|     for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI)
 | |
|       SetRegAsDefined(*AI);
 | |
| 
 | |
|   // Scan all the physical registers. When a register is defined in the current
 | |
|   // function set it and all the aliasing registers as defined in the regmask.
 | |
|   // FIXME: Rewrite to use regunits.
 | |
|   for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
 | |
|     // Don't count registers that are saved and restored.
 | |
|     if (SavedRegs.test(PReg))
 | |
|       continue;
 | |
|     // If a register is defined by an instruction mark it as defined together
 | |
|     // with all it's unsaved aliases.
 | |
|     if (!MRI->def_empty(PReg)) {
 | |
|       for (MCRegAliasIterator AI(PReg, TRI, true); AI.isValid(); ++AI)
 | |
|         if (!SavedRegs.test(*AI))
 | |
|           SetRegAsDefined(*AI);
 | |
|       continue;
 | |
|     }
 | |
|     // If a register is in the UsedPhysRegsMask set then mark it as defined.
 | |
|     // All clobbered aliases will also be in the set, so we can skip setting
 | |
|     // as defined all the aliases here.
 | |
|     if (UsedPhysRegsMask.test(PReg))
 | |
|       SetRegAsDefined(PReg);
 | |
|   }
 | |
| 
 | |
|   if (TargetFrameLowering::isSafeForNoCSROpt(F) &&
 | |
|       MF.getSubtarget().getFrameLowering()->isProfitableForNoCSROpt(F)) {
 | |
|     ++NumCSROpt;
 | |
|     LLVM_DEBUG(dbgs() << MF.getName()
 | |
|                       << " function optimized for not having CSR.\n");
 | |
|   }
 | |
| 
 | |
|   LLVM_DEBUG(
 | |
|     for (unsigned PReg = 1, PRegE = TRI->getNumRegs(); PReg < PRegE; ++PReg) {
 | |
|       if (MachineOperand::clobbersPhysReg(&(RegMask[0]), PReg))
 | |
|         dbgs() << printReg(PReg, TRI) << " ";
 | |
|     }
 | |
| 
 | |
|     dbgs() << " \n----------------------------------------\n";
 | |
|   );
 | |
| 
 | |
|   PRUI.storeUpdateRegUsageInfo(F, RegMask);
 | |
| 
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| void RegUsageInfoCollector::
 | |
| computeCalleeSavedRegs(BitVector &SavedRegs, MachineFunction &MF) {
 | |
|   const TargetFrameLowering &TFI = *MF.getSubtarget().getFrameLowering();
 | |
|   const TargetRegisterInfo &TRI = *MF.getSubtarget().getRegisterInfo();
 | |
| 
 | |
|   // Target will return the set of registers that it saves/restores as needed.
 | |
|   SavedRegs.clear();
 | |
|   TFI.getCalleeSaves(MF, SavedRegs);
 | |
|   if (SavedRegs.none())
 | |
|     return;
 | |
| 
 | |
|   // Insert subregs.
 | |
|   const MCPhysReg *CSRegs = TRI.getCalleeSavedRegs(&MF);
 | |
|   for (unsigned i = 0; CSRegs[i]; ++i) {
 | |
|     MCPhysReg Reg = CSRegs[i];
 | |
|     if (SavedRegs.test(Reg)) {
 | |
|       // Save subregisters
 | |
|       for (MCSubRegIterator SR(Reg, &TRI); SR.isValid(); ++SR)
 | |
|         SavedRegs.set(*SR);
 | |
|     }
 | |
|   }
 | |
| }
 |