196 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			196 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
//===- HexagonVExtract.cpp ------------------------------------------------===//
 | 
						|
//
 | 
						|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | 
						|
// See https://llvm.org/LICENSE.txt for license information.
 | 
						|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
// This pass will replace multiple occurrences of V6_extractw from the same
 | 
						|
// vector register with a combination of a vector store and scalar loads.
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#include "Hexagon.h"
 | 
						|
#include "HexagonInstrInfo.h"
 | 
						|
#include "HexagonMachineFunctionInfo.h"
 | 
						|
#include "HexagonRegisterInfo.h"
 | 
						|
#include "HexagonSubtarget.h"
 | 
						|
#include "llvm/ADT/SmallVector.h"
 | 
						|
#include "llvm/Pass.h"
 | 
						|
#include "llvm/CodeGen/MachineBasicBlock.h"
 | 
						|
#include "llvm/CodeGen/MachineFunction.h"
 | 
						|
#include "llvm/CodeGen/MachineFunctionPass.h"
 | 
						|
#include "llvm/CodeGen/MachineInstrBuilder.h"
 | 
						|
#include "llvm/CodeGen/MachineRegisterInfo.h"
 | 
						|
#include "llvm/Support/CommandLine.h"
 | 
						|
 | 
						|
#include <map>
 | 
						|
 | 
						|
using namespace llvm;
 | 
						|
 | 
						|
static cl::opt<unsigned> VExtractThreshold("hexagon-vextract-threshold",
 | 
						|
  cl::Hidden, cl::ZeroOrMore, cl::init(1),
 | 
						|
  cl::desc("Threshold for triggering vextract replacement"));
 | 
						|
 | 
						|
namespace llvm {
 | 
						|
  void initializeHexagonVExtractPass(PassRegistry& Registry);
 | 
						|
  FunctionPass *createHexagonVExtract();
 | 
						|
}
 | 
						|
 | 
						|
namespace {
 | 
						|
  class HexagonVExtract : public MachineFunctionPass {
 | 
						|
  public:
 | 
						|
    static char ID;
 | 
						|
    HexagonVExtract() : MachineFunctionPass(ID) {}
 | 
						|
 | 
						|
    StringRef getPassName() const override {
 | 
						|
      return "Hexagon optimize vextract";
 | 
						|
    }
 | 
						|
    void getAnalysisUsage(AnalysisUsage &AU) const override {
 | 
						|
      MachineFunctionPass::getAnalysisUsage(AU);
 | 
						|
    }
 | 
						|
    bool runOnMachineFunction(MachineFunction &MF) override;
 | 
						|
 | 
						|
  private:
 | 
						|
    const HexagonSubtarget *HST = nullptr;
 | 
						|
    const HexagonInstrInfo *HII = nullptr;
 | 
						|
 | 
						|
    unsigned genElemLoad(MachineInstr *ExtI, unsigned BaseR,
 | 
						|
                         MachineRegisterInfo &MRI);
 | 
						|
  };
 | 
						|
 | 
						|
  char HexagonVExtract::ID = 0;
 | 
						|
}
 | 
						|
 | 
						|
INITIALIZE_PASS(HexagonVExtract, "hexagon-vextract",
 | 
						|
  "Hexagon optimize vextract", false, false)
 | 
						|
 | 
						|
unsigned HexagonVExtract::genElemLoad(MachineInstr *ExtI, unsigned BaseR,
 | 
						|
                                      MachineRegisterInfo &MRI) {
 | 
						|
  MachineBasicBlock &ExtB = *ExtI->getParent();
 | 
						|
  DebugLoc DL = ExtI->getDebugLoc();
 | 
						|
  Register ElemR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
 | 
						|
 | 
						|
  Register ExtIdxR = ExtI->getOperand(2).getReg();
 | 
						|
  unsigned ExtIdxS = ExtI->getOperand(2).getSubReg();
 | 
						|
 | 
						|
  // Simplified check for a compile-time constant value of ExtIdxR.
 | 
						|
  if (ExtIdxS == 0) {
 | 
						|
    MachineInstr *DI = MRI.getVRegDef(ExtIdxR);
 | 
						|
    if (DI->getOpcode() == Hexagon::A2_tfrsi) {
 | 
						|
      unsigned V = DI->getOperand(1).getImm();
 | 
						|
      V &= (HST->getVectorLength()-1) & -4u;
 | 
						|
 | 
						|
      BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::L2_loadri_io), ElemR)
 | 
						|
        .addReg(BaseR)
 | 
						|
        .addImm(V);
 | 
						|
      return ElemR;
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  Register IdxR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
 | 
						|
  BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::A2_andir), IdxR)
 | 
						|
    .add(ExtI->getOperand(2))
 | 
						|
    .addImm(-4);
 | 
						|
  BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::L4_loadri_rr), ElemR)
 | 
						|
    .addReg(BaseR)
 | 
						|
    .addReg(IdxR)
 | 
						|
    .addImm(0);
 | 
						|
  return ElemR;
 | 
						|
}
 | 
						|
 | 
						|
bool HexagonVExtract::runOnMachineFunction(MachineFunction &MF) {
 | 
						|
  HST = &MF.getSubtarget<HexagonSubtarget>();
 | 
						|
  HII = HST->getInstrInfo();
 | 
						|
  const auto &HRI = *HST->getRegisterInfo();
 | 
						|
  MachineRegisterInfo &MRI = MF.getRegInfo();
 | 
						|
  MachineFrameInfo &MFI = MF.getFrameInfo();
 | 
						|
  Register AR =
 | 
						|
      MF.getInfo<HexagonMachineFunctionInfo>()->getStackAlignBaseVReg();
 | 
						|
  std::map<unsigned, SmallVector<MachineInstr*,4>> VExtractMap;
 | 
						|
  MaybeAlign MaxAlign;
 | 
						|
  bool Changed = false;
 | 
						|
 | 
						|
  for (MachineBasicBlock &MBB : MF) {
 | 
						|
    for (MachineInstr &MI : MBB) {
 | 
						|
      unsigned Opc = MI.getOpcode();
 | 
						|
      if (Opc != Hexagon::V6_extractw)
 | 
						|
        continue;
 | 
						|
      Register VecR = MI.getOperand(1).getReg();
 | 
						|
      VExtractMap[VecR].push_back(&MI);
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  auto EmitAddr = [&] (MachineBasicBlock &BB, MachineBasicBlock::iterator At,
 | 
						|
                       DebugLoc dl, int FI, unsigned Offset) {
 | 
						|
    Register AddrR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
 | 
						|
    unsigned FiOpc = AR != 0 ? Hexagon::PS_fia : Hexagon::PS_fi;
 | 
						|
    auto MIB = BuildMI(BB, At, dl, HII->get(FiOpc), AddrR);
 | 
						|
    if (AR)
 | 
						|
      MIB.addReg(AR);
 | 
						|
    MIB.addFrameIndex(FI).addImm(Offset);
 | 
						|
    return AddrR;
 | 
						|
  };
 | 
						|
 | 
						|
  for (auto &P : VExtractMap) {
 | 
						|
    unsigned VecR = P.first;
 | 
						|
    if (P.second.size() <= VExtractThreshold)
 | 
						|
      continue;
 | 
						|
 | 
						|
    const auto &VecRC = *MRI.getRegClass(VecR);
 | 
						|
    Align Alignment = HRI.getSpillAlign(VecRC);
 | 
						|
    MaxAlign = max(MaxAlign, Alignment);
 | 
						|
    // Make sure this is not a spill slot: spill slots cannot be aligned
 | 
						|
    // if there are variable-sized objects on the stack. They must be
 | 
						|
    // accessible via FP (which is not aligned), because SP is unknown,
 | 
						|
    // and AP may not be available at the location of the load/store.
 | 
						|
    int FI = MFI.CreateStackObject(HRI.getSpillSize(VecRC), Alignment,
 | 
						|
                                   /*isSpillSlot*/ false);
 | 
						|
 | 
						|
    MachineInstr *DefI = MRI.getVRegDef(VecR);
 | 
						|
    MachineBasicBlock::iterator At = std::next(DefI->getIterator());
 | 
						|
    MachineBasicBlock &DefB = *DefI->getParent();
 | 
						|
    unsigned StoreOpc = VecRC.getID() == Hexagon::HvxVRRegClassID
 | 
						|
                          ? Hexagon::V6_vS32b_ai
 | 
						|
                          : Hexagon::PS_vstorerw_ai;
 | 
						|
    Register AddrR = EmitAddr(DefB, At, DefI->getDebugLoc(), FI, 0);
 | 
						|
    BuildMI(DefB, At, DefI->getDebugLoc(), HII->get(StoreOpc))
 | 
						|
      .addReg(AddrR)
 | 
						|
      .addImm(0)
 | 
						|
      .addReg(VecR);
 | 
						|
 | 
						|
    unsigned VecSize = HRI.getRegSizeInBits(VecRC) / 8;
 | 
						|
 | 
						|
    for (MachineInstr *ExtI : P.second) {
 | 
						|
      assert(ExtI->getOpcode() == Hexagon::V6_extractw);
 | 
						|
      unsigned SR = ExtI->getOperand(1).getSubReg();
 | 
						|
      assert(ExtI->getOperand(1).getReg() == VecR);
 | 
						|
 | 
						|
      MachineBasicBlock &ExtB = *ExtI->getParent();
 | 
						|
      DebugLoc DL = ExtI->getDebugLoc();
 | 
						|
      Register BaseR = EmitAddr(ExtB, ExtI, ExtI->getDebugLoc(), FI,
 | 
						|
                                SR == 0 ? 0 : VecSize/2);
 | 
						|
 | 
						|
      unsigned ElemR = genElemLoad(ExtI, BaseR, MRI);
 | 
						|
      Register ExtR = ExtI->getOperand(0).getReg();
 | 
						|
      MRI.replaceRegWith(ExtR, ElemR);
 | 
						|
      ExtB.erase(ExtI);
 | 
						|
      Changed = true;
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  if (AR && MaxAlign) {
 | 
						|
    // Update the required stack alignment.
 | 
						|
    MachineInstr *AlignaI = MRI.getVRegDef(AR);
 | 
						|
    assert(AlignaI->getOpcode() == Hexagon::PS_aligna);
 | 
						|
    MachineOperand &Op = AlignaI->getOperand(1);
 | 
						|
    if (*MaxAlign > Op.getImm())
 | 
						|
      Op.setImm(MaxAlign->value());
 | 
						|
  }
 | 
						|
 | 
						|
  return Changed;
 | 
						|
}
 | 
						|
 | 
						|
FunctionPass *llvm::createHexagonVExtract() {
 | 
						|
  return new HexagonVExtract();
 | 
						|
}
 |