diff options
Diffstat (limited to 'contrib/llvm-project/llvm/lib/Target/AMDGPU/SIProgramInfo.h')
| -rw-r--r-- | contrib/llvm-project/llvm/lib/Target/AMDGPU/SIProgramInfo.h | 82 | 
1 files changed, 82 insertions, 0 deletions
diff --git a/contrib/llvm-project/llvm/lib/Target/AMDGPU/SIProgramInfo.h b/contrib/llvm-project/llvm/lib/Target/AMDGPU/SIProgramInfo.h new file mode 100644 index 000000000000..553fb4cf496c --- /dev/null +++ b/contrib/llvm-project/llvm/lib/Target/AMDGPU/SIProgramInfo.h @@ -0,0 +1,82 @@ +//===--- SIProgramInfo.h ----------------------------------------*- C++ -*-===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// +// +/// \file +/// Defines struct to track resource usage and hardware flags for kernels and +/// entry functions. +/// +// +//===----------------------------------------------------------------------===// + +#ifndef LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H +#define LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H + +#include "llvm/IR/CallingConv.h" +#include <cstdint> + +namespace llvm { + +/// Track resource usage for kernels / entry functions. +struct SIProgramInfo { +    // Fields set in PGM_RSRC1 pm4 packet. +    uint32_t VGPRBlocks = 0; +    uint32_t SGPRBlocks = 0; +    uint32_t Priority = 0; +    uint32_t FloatMode = 0; +    uint32_t Priv = 0; +    uint32_t DX10Clamp = 0; +    uint32_t DebugMode = 0; +    uint32_t IEEEMode = 0; +    uint32_t WgpMode = 0; // GFX10+ +    uint32_t MemOrdered = 0; // GFX10+ +    uint64_t ScratchSize = 0; + +    // Fields set in PGM_RSRC2 pm4 packet. +    uint32_t LDSBlocks = 0; +    uint32_t ScratchBlocks = 0; + +    uint64_t ComputePGMRSrc2 = 0; +    uint64_t ComputePGMRSrc3GFX90A = 0; + +    uint32_t NumVGPR = 0; +    uint32_t NumArchVGPR = 0; +    uint32_t NumAccVGPR = 0; +    uint32_t AccumOffset = 0; +    uint32_t TgSplit = 0; +    uint32_t NumSGPR = 0; +    unsigned SGPRSpill = 0; +    unsigned VGPRSpill = 0; +    uint32_t LDSSize = 0; +    bool FlatUsed = false; + +    // Number of SGPRs that meets number of waves per execution unit request. +    uint32_t NumSGPRsForWavesPerEU = 0; + +    // Number of VGPRs that meets number of waves per execution unit request. +    uint32_t NumVGPRsForWavesPerEU = 0; + +    // Final occupancy. +    uint32_t Occupancy = 0; + +    // Whether there is recursion, dynamic allocas, indirect calls or some other +    // reason there may be statically unknown stack usage. +    bool DynamicCallStack = false; + +    // Bonus information for debugging. +    bool VCCUsed = false; + +    SIProgramInfo() = default; + +    /// Compute the value of the ComputePGMRsrc1 register. +    uint64_t getComputePGMRSrc1() const; +    uint64_t getPGMRSrc1(CallingConv::ID CC) const; +}; + +} // namespace llvm + +#endif // LLVM_LIB_TARGET_AMDGPU_SIPROGRAMINFO_H  | 
