311 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			311 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
//=====-- AMDGPUSubtarget.h - Define Subtarget for AMDGPU ------*- C++ -*-====//
 | 
						|
//
 | 
						|
//                     The LLVM Compiler Infrastructure
 | 
						|
//
 | 
						|
// This file is distributed under the University of Illinois Open Source
 | 
						|
// License. See LICENSE.TXT for details.
 | 
						|
//
 | 
						|
//==-----------------------------------------------------------------------===//
 | 
						|
//
 | 
						|
/// \file
 | 
						|
/// \brief AMDGPU specific subclass of TargetSubtarget.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUSUBTARGET_H
 | 
						|
#define LLVM_LIB_TARGET_AMDGPU_AMDGPUSUBTARGET_H
 | 
						|
 | 
						|
#include "AMDGPU.h"
 | 
						|
#include "AMDGPUFrameLowering.h"
 | 
						|
#include "AMDGPUInstrInfo.h"
 | 
						|
#include "AMDGPUISelLowering.h"
 | 
						|
#include "AMDGPUSubtarget.h"
 | 
						|
#include "Utils/AMDGPUBaseInfo.h"
 | 
						|
#include "llvm/ADT/StringRef.h"
 | 
						|
#include "llvm/Target/TargetSubtargetInfo.h"
 | 
						|
 | 
						|
#define GET_SUBTARGETINFO_HEADER
 | 
						|
#include "AMDGPUGenSubtargetInfo.inc"
 | 
						|
 | 
						|
namespace llvm {
 | 
						|
 | 
						|
class SIMachineFunctionInfo;
 | 
						|
 | 
						|
class AMDGPUSubtarget : public AMDGPUGenSubtargetInfo {
 | 
						|
 | 
						|
public:
 | 
						|
  enum Generation {
 | 
						|
    R600 = 0,
 | 
						|
    R700,
 | 
						|
    EVERGREEN,
 | 
						|
    NORTHERN_ISLANDS,
 | 
						|
    SOUTHERN_ISLANDS,
 | 
						|
    SEA_ISLANDS,
 | 
						|
    VOLCANIC_ISLANDS,
 | 
						|
  };
 | 
						|
 | 
						|
  enum {
 | 
						|
    FIXED_SGPR_COUNT_FOR_INIT_BUG = 80
 | 
						|
  };
 | 
						|
 | 
						|
  enum {
 | 
						|
    ISAVersion0_0_0,
 | 
						|
    ISAVersion7_0_0,
 | 
						|
    ISAVersion7_0_1,
 | 
						|
    ISAVersion8_0_0,
 | 
						|
    ISAVersion8_0_1
 | 
						|
  };
 | 
						|
 | 
						|
private:
 | 
						|
  std::string DevName;
 | 
						|
  bool Is64bit;
 | 
						|
  bool DumpCode;
 | 
						|
  bool R600ALUInst;
 | 
						|
  bool HasVertexCache;
 | 
						|
  short TexVTXClauseSize;
 | 
						|
  Generation Gen;
 | 
						|
  bool FP64;
 | 
						|
  bool FP64Denormals;
 | 
						|
  bool FP32Denormals;
 | 
						|
  bool FastFMAF32;
 | 
						|
  bool CaymanISA;
 | 
						|
  bool FlatAddressSpace;
 | 
						|
  bool EnableIRStructurizer;
 | 
						|
  bool EnablePromoteAlloca;
 | 
						|
  bool EnableIfCvt;
 | 
						|
  bool EnableLoadStoreOpt;
 | 
						|
  bool EnableUnsafeDSOffsetFolding;
 | 
						|
  unsigned WavefrontSize;
 | 
						|
  bool CFALUBug;
 | 
						|
  int LocalMemorySize;
 | 
						|
  bool EnableVGPRSpilling;
 | 
						|
  bool SGPRInitBug;
 | 
						|
  bool IsGCN;
 | 
						|
  bool GCN1Encoding;
 | 
						|
  bool GCN3Encoding;
 | 
						|
  bool CIInsts;
 | 
						|
  bool FeatureDisable;
 | 
						|
  int LDSBankCount;
 | 
						|
  unsigned IsaVersion;
 | 
						|
  bool EnableHugeScratchBuffer;
 | 
						|
 | 
						|
  std::unique_ptr<AMDGPUFrameLowering> FrameLowering;
 | 
						|
  std::unique_ptr<AMDGPUTargetLowering> TLInfo;
 | 
						|
  std::unique_ptr<AMDGPUInstrInfo> InstrInfo;
 | 
						|
  InstrItineraryData InstrItins;
 | 
						|
  Triple TargetTriple;
 | 
						|
 | 
						|
public:
 | 
						|
  AMDGPUSubtarget(const Triple &TT, StringRef CPU, StringRef FS,
 | 
						|
                  TargetMachine &TM);
 | 
						|
  AMDGPUSubtarget &initializeSubtargetDependencies(const Triple &TT,
 | 
						|
                                                   StringRef GPU, StringRef FS);
 | 
						|
 | 
						|
  const AMDGPUFrameLowering *getFrameLowering() const override {
 | 
						|
    return FrameLowering.get();
 | 
						|
  }
 | 
						|
  const AMDGPUInstrInfo *getInstrInfo() const override {
 | 
						|
    return InstrInfo.get();
 | 
						|
  }
 | 
						|
  const AMDGPURegisterInfo *getRegisterInfo() const override {
 | 
						|
    return &InstrInfo->getRegisterInfo();
 | 
						|
  }
 | 
						|
  AMDGPUTargetLowering *getTargetLowering() const override {
 | 
						|
    return TLInfo.get();
 | 
						|
  }
 | 
						|
  const InstrItineraryData *getInstrItineraryData() const override {
 | 
						|
    return &InstrItins;
 | 
						|
  }
 | 
						|
 | 
						|
  void ParseSubtargetFeatures(StringRef CPU, StringRef FS);
 | 
						|
 | 
						|
  bool is64bit() const {
 | 
						|
    return Is64bit;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasVertexCache() const {
 | 
						|
    return HasVertexCache;
 | 
						|
  }
 | 
						|
 | 
						|
  short getTexVTXClauseSize() const {
 | 
						|
    return TexVTXClauseSize;
 | 
						|
  }
 | 
						|
 | 
						|
  Generation getGeneration() const {
 | 
						|
    return Gen;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasHWFP64() const {
 | 
						|
    return FP64;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasCaymanISA() const {
 | 
						|
    return CaymanISA;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFP32Denormals() const {
 | 
						|
    return FP32Denormals;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFP64Denormals() const {
 | 
						|
    return FP64Denormals;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFastFMAF32() const {
 | 
						|
    return FastFMAF32;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFlatAddressSpace() const {
 | 
						|
    return FlatAddressSpace;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasBFE() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasBFI() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasBFM() const {
 | 
						|
    return hasBFE();
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasBCNT(unsigned Size) const {
 | 
						|
    if (Size == 32)
 | 
						|
      return (getGeneration() >= EVERGREEN);
 | 
						|
 | 
						|
    if (Size == 64)
 | 
						|
      return (getGeneration() >= SOUTHERN_ISLANDS);
 | 
						|
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasMulU24() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasMulI24() const {
 | 
						|
    return (getGeneration() >= SOUTHERN_ISLANDS ||
 | 
						|
            hasCaymanISA());
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFFBL() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasFFBH() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasCARRY() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasBORROW() const {
 | 
						|
    return (getGeneration() >= EVERGREEN);
 | 
						|
  }
 | 
						|
 | 
						|
  bool IsIRStructurizerEnabled() const {
 | 
						|
    return EnableIRStructurizer;
 | 
						|
  }
 | 
						|
 | 
						|
  bool isPromoteAllocaEnabled() const {
 | 
						|
    return EnablePromoteAlloca;
 | 
						|
  }
 | 
						|
 | 
						|
  bool isIfCvtEnabled() const {
 | 
						|
    return EnableIfCvt;
 | 
						|
  }
 | 
						|
 | 
						|
  bool loadStoreOptEnabled() const {
 | 
						|
    return EnableLoadStoreOpt;
 | 
						|
  }
 | 
						|
 | 
						|
  bool unsafeDSOffsetFoldingEnabled() const {
 | 
						|
    return EnableUnsafeDSOffsetFolding;
 | 
						|
  }
 | 
						|
 | 
						|
  unsigned getWavefrontSize() const {
 | 
						|
    return WavefrontSize;
 | 
						|
  }
 | 
						|
 | 
						|
  unsigned getStackEntrySize() const;
 | 
						|
 | 
						|
  bool hasCFAluBug() const {
 | 
						|
    assert(getGeneration() <= NORTHERN_ISLANDS);
 | 
						|
    return CFALUBug;
 | 
						|
  }
 | 
						|
 | 
						|
  int getLocalMemorySize() const {
 | 
						|
    return LocalMemorySize;
 | 
						|
  }
 | 
						|
 | 
						|
  bool hasSGPRInitBug() const {
 | 
						|
    return SGPRInitBug;
 | 
						|
  }
 | 
						|
 | 
						|
  int getLDSBankCount() const {
 | 
						|
    return LDSBankCount;
 | 
						|
  }
 | 
						|
 | 
						|
  unsigned getAmdKernelCodeChipID() const;
 | 
						|
 | 
						|
  AMDGPU::IsaVersion getIsaVersion() const;
 | 
						|
 | 
						|
  bool enableMachineScheduler() const override {
 | 
						|
    return true;
 | 
						|
  }
 | 
						|
 | 
						|
  void overrideSchedPolicy(MachineSchedPolicy &Policy,
 | 
						|
                           MachineInstr *begin, MachineInstr *end,
 | 
						|
                           unsigned NumRegionInstrs) const override;
 | 
						|
 | 
						|
  // Helper functions to simplify if statements
 | 
						|
  bool isTargetELF() const {
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  StringRef getDeviceName() const {
 | 
						|
    return DevName;
 | 
						|
  }
 | 
						|
 | 
						|
  bool enableHugeScratchBuffer() const {
 | 
						|
    return EnableHugeScratchBuffer;
 | 
						|
  }
 | 
						|
 | 
						|
  bool dumpCode() const {
 | 
						|
    return DumpCode;
 | 
						|
  }
 | 
						|
  bool r600ALUEncoding() const {
 | 
						|
    return R600ALUInst;
 | 
						|
  }
 | 
						|
  bool isAmdHsaOS() const {
 | 
						|
    return TargetTriple.getOS() == Triple::AMDHSA;
 | 
						|
  }
 | 
						|
  bool isVGPRSpillingEnabled(const SIMachineFunctionInfo *MFI) const;
 | 
						|
 | 
						|
  unsigned getMaxWavesPerCU() const {
 | 
						|
    if (getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS)
 | 
						|
      return 10;
 | 
						|
 | 
						|
    // FIXME: Not sure what this is for other subtagets.
 | 
						|
    llvm_unreachable("do not know max waves per CU for this subtarget.");
 | 
						|
  }
 | 
						|
 | 
						|
  bool enableSubRegLiveness() const override {
 | 
						|
    return true;
 | 
						|
  }
 | 
						|
 | 
						|
  /// \brief Returns the offset in bytes from the start of the input buffer
 | 
						|
  ///        of the first explicit kernel argument.
 | 
						|
  unsigned getExplicitKernelArgOffset() const {
 | 
						|
    return isAmdHsaOS() ? 0 : 36;
 | 
						|
  }
 | 
						|
 | 
						|
};
 | 
						|
 | 
						|
} // End namespace llvm
 | 
						|
 | 
						|
#endif
 |