forked from OSchip/llvm-project
				
			
		
			
				
	
	
		
			72 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			72 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C++
		
	
	
	
//===--- SIProgramInfo.h ----------------------------------------*- C++ -*-===//
 | 
						|
//
 | 
						|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | 
						|
// See https://llvm.org/LICENSE.txt for license information.
 | 
						|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
//
 | 
						|
/// \file
 | 
						|
/// Defines struct to track resource usage for kernels and entry functions.
 | 
						|
///
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#ifndef LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H
 | 
						|
#define LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H
 | 
						|
 | 
						|
namespace llvm {
 | 
						|
 | 
						|
/// Track resource usage for kernels / entry functions.
 | 
						|
struct SIProgramInfo {
 | 
						|
    // Fields set in PGM_RSRC1 pm4 packet.
 | 
						|
    uint32_t VGPRBlocks = 0;
 | 
						|
    uint32_t SGPRBlocks = 0;
 | 
						|
    uint32_t Priority = 0;
 | 
						|
    uint32_t FloatMode = 0;
 | 
						|
    uint32_t Priv = 0;
 | 
						|
    uint32_t DX10Clamp = 0;
 | 
						|
    uint32_t DebugMode = 0;
 | 
						|
    uint32_t IEEEMode = 0;
 | 
						|
    uint32_t WgpMode = 0; // GFX10+
 | 
						|
    uint32_t MemOrdered = 0; // GFX10+
 | 
						|
    uint64_t ScratchSize = 0;
 | 
						|
 | 
						|
    uint64_t ComputePGMRSrc1 = 0;
 | 
						|
 | 
						|
    // Fields set in PGM_RSRC2 pm4 packet.
 | 
						|
    uint32_t LDSBlocks = 0;
 | 
						|
    uint32_t ScratchBlocks = 0;
 | 
						|
 | 
						|
    uint64_t ComputePGMRSrc2 = 0;
 | 
						|
 | 
						|
    uint32_t NumVGPR = 0;
 | 
						|
    uint32_t NumArchVGPR = 0;
 | 
						|
    uint32_t NumAccVGPR = 0;
 | 
						|
    uint32_t NumSGPR = 0;
 | 
						|
    uint32_t LDSSize = 0;
 | 
						|
    bool FlatUsed = false;
 | 
						|
 | 
						|
    // Number of SGPRs that meets number of waves per execution unit request.
 | 
						|
    uint32_t NumSGPRsForWavesPerEU = 0;
 | 
						|
 | 
						|
    // Number of VGPRs that meets number of waves per execution unit request.
 | 
						|
    uint32_t NumVGPRsForWavesPerEU = 0;
 | 
						|
 | 
						|
    // Final occupancy.
 | 
						|
    uint32_t Occupancy = 0;
 | 
						|
 | 
						|
    // Whether there is recursion, dynamic allocas, indirect calls or some other
 | 
						|
    // reason there may be statically unknown stack usage.
 | 
						|
    bool DynamicCallStack = false;
 | 
						|
 | 
						|
    // Bonus information for debugging.
 | 
						|
    bool VCCUsed = false;
 | 
						|
 | 
						|
    SIProgramInfo() = default;
 | 
						|
};
 | 
						|
 | 
						|
} // namespace llvm
 | 
						|
 | 
						|
#endif // LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H
 |