forked from eden-emu/eden
		
	
		
			
				
	
	
		
			880 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			880 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // Copyright 2018 yuzu Emulator Project
 | |
| // Licensed under GPLv2 or any later version
 | |
| // Refer to the license.txt file included.
 | |
| 
 | |
| #pragma once
 | |
| 
 | |
| #include <array>
 | |
| #include <cstring>
 | |
| #include <map>
 | |
| #include <optional>
 | |
| #include <set>
 | |
| #include <string>
 | |
| #include <tuple>
 | |
| #include <variant>
 | |
| #include <vector>
 | |
| 
 | |
| #include "common/common_types.h"
 | |
| #include "video_core/engines/maxwell_3d.h"
 | |
| #include "video_core/engines/shader_bytecode.h"
 | |
| #include "video_core/engines/shader_header.h"
 | |
| 
 | |
| namespace VideoCommon::Shader {
 | |
| 
 | |
| class OperationNode;
 | |
| class ConditionalNode;
 | |
| class GprNode;
 | |
| class ImmediateNode;
 | |
| class InternalFlagNode;
 | |
| class PredicateNode;
 | |
| class AbufNode; ///< Attribute buffer
 | |
| class CbufNode; ///< Constant buffer
 | |
| class LmemNode; ///< Local memory
 | |
| class GmemNode; ///< Global memory
 | |
| class CommentNode;
 | |
| 
 | |
| using ProgramCode = std::vector<u64>;
 | |
| 
 | |
| using NodeData =
 | |
|     std::variant<OperationNode, ConditionalNode, GprNode, ImmediateNode, InternalFlagNode,
 | |
|                  PredicateNode, AbufNode, CbufNode, LmemNode, GmemNode, CommentNode>;
 | |
| using Node = const NodeData*;
 | |
| using Node4 = std::array<Node, 4>;
 | |
| using NodeBlock = std::vector<Node>;
 | |
| 
 | |
| constexpr u32 MAX_PROGRAM_LENGTH = 0x1000;
 | |
| 
 | |
| enum class OperationCode {
 | |
|     Assign, /// (float& dest, float src) -> void
 | |
| 
 | |
|     Select, /// (MetaArithmetic, bool pred, float a, float b) -> float
 | |
| 
 | |
|     FAdd,          /// (MetaArithmetic, float a, float b) -> float
 | |
|     FMul,          /// (MetaArithmetic, float a, float b) -> float
 | |
|     FDiv,          /// (MetaArithmetic, float a, float b) -> float
 | |
|     FFma,          /// (MetaArithmetic, float a, float b, float c) -> float
 | |
|     FNegate,       /// (MetaArithmetic, float a) -> float
 | |
|     FAbsolute,     /// (MetaArithmetic, float a) -> float
 | |
|     FClamp,        /// (MetaArithmetic, float value, float min, float max) -> float
 | |
|     FMin,          /// (MetaArithmetic, float a, float b) -> float
 | |
|     FMax,          /// (MetaArithmetic, float a, float b) -> float
 | |
|     FCos,          /// (MetaArithmetic, float a) -> float
 | |
|     FSin,          /// (MetaArithmetic, float a) -> float
 | |
|     FExp2,         /// (MetaArithmetic, float a) -> float
 | |
|     FLog2,         /// (MetaArithmetic, float a) -> float
 | |
|     FInverseSqrt,  /// (MetaArithmetic, float a) -> float
 | |
|     FSqrt,         /// (MetaArithmetic, float a) -> float
 | |
|     FRoundEven,    /// (MetaArithmetic, float a) -> float
 | |
|     FFloor,        /// (MetaArithmetic, float a) -> float
 | |
|     FCeil,         /// (MetaArithmetic, float a) -> float
 | |
|     FTrunc,        /// (MetaArithmetic, float a) -> float
 | |
|     FCastInteger,  /// (MetaArithmetic, int a) -> float
 | |
|     FCastUInteger, /// (MetaArithmetic, uint a) -> float
 | |
| 
 | |
|     IAdd,                  /// (MetaArithmetic, int a, int b) -> int
 | |
|     IMul,                  /// (MetaArithmetic, int a, int b) -> int
 | |
|     IDiv,                  /// (MetaArithmetic, int a, int b) -> int
 | |
|     INegate,               /// (MetaArithmetic, int a) -> int
 | |
|     IAbsolute,             /// (MetaArithmetic, int a) -> int
 | |
|     IMin,                  /// (MetaArithmetic, int a, int b) -> int
 | |
|     IMax,                  /// (MetaArithmetic, int a, int b) -> int
 | |
|     ICastFloat,            /// (MetaArithmetic, float a) -> int
 | |
|     ICastUnsigned,         /// (MetaArithmetic, uint a) -> int
 | |
|     ILogicalShiftLeft,     /// (MetaArithmetic, int a, uint b) -> int
 | |
|     ILogicalShiftRight,    /// (MetaArithmetic, int a, uint b) -> int
 | |
|     IArithmeticShiftRight, /// (MetaArithmetic, int a, uint b) -> int
 | |
|     IBitwiseAnd,           /// (MetaArithmetic, int a, int b) -> int
 | |
|     IBitwiseOr,            /// (MetaArithmetic, int a, int b) -> int
 | |
|     IBitwiseXor,           /// (MetaArithmetic, int a, int b) -> int
 | |
|     IBitwiseNot,           /// (MetaArithmetic, int a) -> int
 | |
|     IBitfieldInsert,       /// (MetaArithmetic, int base, int insert, int offset, int bits) -> int
 | |
|     IBitfieldExtract,      /// (MetaArithmetic, int value, int offset, int offset) -> int
 | |
|     IBitCount,             /// (MetaArithmetic, int) -> int
 | |
| 
 | |
|     UAdd,                  /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UMul,                  /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UDiv,                  /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UMin,                  /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UMax,                  /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UCastFloat,            /// (MetaArithmetic, float a) -> uint
 | |
|     UCastSigned,           /// (MetaArithmetic, int a) -> uint
 | |
|     ULogicalShiftLeft,     /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     ULogicalShiftRight,    /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UArithmeticShiftRight, /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UBitwiseAnd,           /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UBitwiseOr,            /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UBitwiseXor,           /// (MetaArithmetic, uint a, uint b) -> uint
 | |
|     UBitwiseNot,           /// (MetaArithmetic, uint a) -> uint
 | |
|     UBitfieldInsert,  /// (MetaArithmetic, uint base, uint insert, int offset, int bits) -> uint
 | |
|     UBitfieldExtract, /// (MetaArithmetic, uint value, int offset, int offset) -> uint
 | |
|     UBitCount,        /// (MetaArithmetic, uint) -> uint
 | |
| 
 | |
|     HAdd,      /// (MetaArithmetic, f16vec2 a, f16vec2 b) -> f16vec2
 | |
|     HMul,      /// (MetaArithmetic, f16vec2 a, f16vec2 b) -> f16vec2
 | |
|     HFma,      /// (MetaArithmetic, f16vec2 a, f16vec2 b, f16vec2 c) -> f16vec2
 | |
|     HAbsolute, /// (f16vec2 a) -> f16vec2
 | |
|     HNegate,   /// (f16vec2 a, bool first, bool second) -> f16vec2
 | |
|     HClamp,    /// (f16vec2 src, float min, float max) -> f16vec2
 | |
|     HUnpack,   /// (Tegra::Shader::HalfType, T value) -> f16vec2
 | |
|     HMergeF32, /// (f16vec2 src) -> float
 | |
|     HMergeH0,  /// (f16vec2 dest, f16vec2 src) -> f16vec2
 | |
|     HMergeH1,  /// (f16vec2 dest, f16vec2 src) -> f16vec2
 | |
|     HPack2,    /// (float a, float b) -> f16vec2
 | |
| 
 | |
|     LogicalAssign, /// (bool& dst, bool src) -> void
 | |
|     LogicalAnd,    /// (bool a, bool b) -> bool
 | |
|     LogicalOr,     /// (bool a, bool b) -> bool
 | |
|     LogicalXor,    /// (bool a, bool b) -> bool
 | |
|     LogicalNegate, /// (bool a) -> bool
 | |
|     LogicalPick2,  /// (bool2 pair, uint index) -> bool
 | |
|     LogicalAll2,   /// (bool2 a) -> bool
 | |
|     LogicalAny2,   /// (bool2 a) -> bool
 | |
| 
 | |
|     LogicalFLessThan,     /// (float a, float b) -> bool
 | |
|     LogicalFEqual,        /// (float a, float b) -> bool
 | |
|     LogicalFLessEqual,    /// (float a, float b) -> bool
 | |
|     LogicalFGreaterThan,  /// (float a, float b) -> bool
 | |
|     LogicalFNotEqual,     /// (float a, float b) -> bool
 | |
|     LogicalFGreaterEqual, /// (float a, float b) -> bool
 | |
|     LogicalFIsNan,        /// (float a) -> bool
 | |
| 
 | |
|     LogicalILessThan,     /// (int a, int b) -> bool
 | |
|     LogicalIEqual,        /// (int a, int b) -> bool
 | |
|     LogicalILessEqual,    /// (int a, int b) -> bool
 | |
|     LogicalIGreaterThan,  /// (int a, int b) -> bool
 | |
|     LogicalINotEqual,     /// (int a, int b) -> bool
 | |
|     LogicalIGreaterEqual, /// (int a, int b) -> bool
 | |
| 
 | |
|     LogicalULessThan,     /// (uint a, uint b) -> bool
 | |
|     LogicalUEqual,        /// (uint a, uint b) -> bool
 | |
|     LogicalULessEqual,    /// (uint a, uint b) -> bool
 | |
|     LogicalUGreaterThan,  /// (uint a, uint b) -> bool
 | |
|     LogicalUNotEqual,     /// (uint a, uint b) -> bool
 | |
|     LogicalUGreaterEqual, /// (uint a, uint b) -> bool
 | |
| 
 | |
|     Logical2HLessThan,            /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HEqual,               /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HLessEqual,           /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HGreaterThan,         /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HNotEqual,            /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HGreaterEqual,        /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HLessThanWithNan,     /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HEqualWithNan,        /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HLessEqualWithNan,    /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HGreaterThanWithNan,  /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HNotEqualWithNan,     /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
|     Logical2HGreaterEqualWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2
 | |
| 
 | |
|     Texture,                /// (MetaTexture, float[N] coords) -> float4
 | |
|     TextureLod,             /// (MetaTexture, float[N] coords) -> float4
 | |
|     TextureGather,          /// (MetaTexture, float[N] coords) -> float4
 | |
|     TextureQueryDimensions, /// (MetaTexture, float a) -> float4
 | |
|     TextureQueryLod,        /// (MetaTexture, float[N] coords) -> float4
 | |
|     TexelFetch,             /// (MetaTexture, int[N], int) -> float4
 | |
| 
 | |
|     Branch,        /// (uint branch_target) -> void
 | |
|     PushFlowStack, /// (uint branch_target) -> void
 | |
|     PopFlowStack,  /// () -> void
 | |
|     Exit,          /// () -> void
 | |
|     Discard,       /// () -> void
 | |
| 
 | |
|     EmitVertex,   /// () -> void
 | |
|     EndPrimitive, /// () -> void
 | |
| 
 | |
|     YNegate, /// () -> float
 | |
| 
 | |
|     Amount,
 | |
| };
 | |
| 
 | |
| enum class InternalFlag {
 | |
|     Zero = 0,
 | |
|     Sign = 1,
 | |
|     Carry = 2,
 | |
|     Overflow = 3,
 | |
|     Amount = 4,
 | |
| };
 | |
| 
 | |
| /// Describes the behaviour of code path of a given entry point and a return point.
 | |
| enum class ExitMethod {
 | |
|     Undetermined, ///< Internal value. Only occur when analyzing JMP loop.
 | |
|     AlwaysReturn, ///< All code paths reach the return point.
 | |
|     Conditional,  ///< Code path reaches the return point or an END instruction conditionally.
 | |
|     AlwaysEnd,    ///< All code paths reach a END instruction.
 | |
| };
 | |
| 
 | |
| class Sampler {
 | |
| public:
 | |
|     // Use this constructor for bounded Samplers
 | |
|     explicit Sampler(std::size_t offset, std::size_t index, Tegra::Shader::TextureType type,
 | |
|                      bool is_array, bool is_shadow)
 | |
|         : offset{offset}, index{index}, type{type}, is_array{is_array}, is_shadow{is_shadow},
 | |
|           is_bindless{false} {}
 | |
| 
 | |
|     // Use this constructor for bindless Samplers
 | |
|     explicit Sampler(u32 cbuf_index, u32 cbuf_offset, std::size_t index,
 | |
|                      Tegra::Shader::TextureType type, bool is_array, bool is_shadow)
 | |
|         : offset{(static_cast<u64>(cbuf_index) << 32) | cbuf_offset}, index{index}, type{type},
 | |
|           is_array{is_array}, is_shadow{is_shadow}, is_bindless{true} {}
 | |
| 
 | |
|     // Use this only for serialization/deserialization
 | |
|     explicit Sampler(std::size_t offset, std::size_t index, Tegra::Shader::TextureType type,
 | |
|                      bool is_array, bool is_shadow, bool is_bindless)
 | |
|         : offset{offset}, index{index}, type{type}, is_array{is_array}, is_shadow{is_shadow},
 | |
|           is_bindless{is_bindless} {}
 | |
| 
 | |
|     std::size_t GetOffset() const {
 | |
|         return offset;
 | |
|     }
 | |
| 
 | |
|     std::size_t GetIndex() const {
 | |
|         return index;
 | |
|     }
 | |
| 
 | |
|     Tegra::Shader::TextureType GetType() const {
 | |
|         return type;
 | |
|     }
 | |
| 
 | |
|     bool IsArray() const {
 | |
|         return is_array;
 | |
|     }
 | |
| 
 | |
|     bool IsShadow() const {
 | |
|         return is_shadow;
 | |
|     }
 | |
| 
 | |
|     bool IsBindless() const {
 | |
|         return is_bindless;
 | |
|     }
 | |
| 
 | |
|     std::pair<u32, u32> GetBindlessCBuf() const {
 | |
|         return {static_cast<u32>(offset >> 32), static_cast<u32>(offset)};
 | |
|     }
 | |
| 
 | |
|     bool operator<(const Sampler& rhs) const {
 | |
|         return std::tie(index, offset, type, is_array, is_shadow, is_bindless) <
 | |
|                std::tie(rhs.index, rhs.offset, rhs.type, rhs.is_array, rhs.is_shadow,
 | |
|                         rhs.is_bindless);
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     /// Offset in TSC memory from which to read the sampler object, as specified by the sampling
 | |
|     /// instruction.
 | |
|     std::size_t offset{};
 | |
|     std::size_t index{}; ///< Value used to index into the generated GLSL sampler array.
 | |
|     Tegra::Shader::TextureType type{}; ///< The type used to sample this texture (Texture2D, etc)
 | |
|     bool is_array{};    ///< Whether the texture is being sampled as an array texture or not.
 | |
|     bool is_shadow{};   ///< Whether the texture is being sampled as a depth texture or not.
 | |
|     bool is_bindless{}; ///< Whether this sampler belongs to a bindless texture or not.
 | |
| };
 | |
| 
 | |
| class ConstBuffer {
 | |
| public:
 | |
|     explicit ConstBuffer(u32 max_offset, bool is_indirect)
 | |
|         : max_offset{max_offset}, is_indirect{is_indirect} {}
 | |
| 
 | |
|     ConstBuffer() = default;
 | |
| 
 | |
|     void MarkAsUsed(u64 offset) {
 | |
|         max_offset = std::max(max_offset, static_cast<u32>(offset));
 | |
|     }
 | |
| 
 | |
|     void MarkAsUsedIndirect() {
 | |
|         is_indirect = true;
 | |
|     }
 | |
| 
 | |
|     bool IsIndirect() const {
 | |
|         return is_indirect;
 | |
|     }
 | |
| 
 | |
|     u32 GetSize() const {
 | |
|         return max_offset + sizeof(float);
 | |
|     }
 | |
| 
 | |
|     u32 GetMaxOffset() const {
 | |
|         return max_offset;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     u32 max_offset{};
 | |
|     bool is_indirect{};
 | |
| };
 | |
| 
 | |
| struct GlobalMemoryBase {
 | |
|     u32 cbuf_index{};
 | |
|     u32 cbuf_offset{};
 | |
| 
 | |
|     bool operator<(const GlobalMemoryBase& rhs) const {
 | |
|         return std::tie(cbuf_index, cbuf_offset) < std::tie(rhs.cbuf_index, rhs.cbuf_offset);
 | |
|     }
 | |
| };
 | |
| 
 | |
| struct GlobalMemoryUsage {
 | |
|     bool is_read{};
 | |
|     bool is_written{};
 | |
| };
 | |
| 
 | |
| struct MetaArithmetic {
 | |
|     bool precise{};
 | |
| };
 | |
| 
 | |
| struct MetaTexture {
 | |
|     const Sampler& sampler;
 | |
|     Node array{};
 | |
|     Node depth_compare{};
 | |
|     std::vector<Node> aoffi;
 | |
|     Node bias{};
 | |
|     Node lod{};
 | |
|     Node component{};
 | |
|     u32 element{};
 | |
| };
 | |
| 
 | |
| constexpr MetaArithmetic PRECISE = {true};
 | |
| constexpr MetaArithmetic NO_PRECISE = {false};
 | |
| 
 | |
| using Meta = std::variant<MetaArithmetic, MetaTexture, Tegra::Shader::HalfType>;
 | |
| 
 | |
| /// Holds any kind of operation that can be done in the IR
 | |
| class OperationNode final {
 | |
| public:
 | |
|     explicit OperationNode(OperationCode code) : code{code} {}
 | |
| 
 | |
|     explicit OperationNode(OperationCode code, Meta&& meta) : code{code}, meta{std::move(meta)} {}
 | |
| 
 | |
|     template <typename... T>
 | |
|     explicit OperationNode(OperationCode code, const T*... operands)
 | |
|         : OperationNode(code, {}, operands...) {}
 | |
| 
 | |
|     template <typename... T>
 | |
|     explicit OperationNode(OperationCode code, Meta&& meta, const T*... operands_)
 | |
|         : code{code}, meta{std::move(meta)}, operands{operands_...} {}
 | |
| 
 | |
|     explicit OperationNode(OperationCode code, Meta&& meta, std::vector<Node>&& operands)
 | |
|         : code{code}, meta{meta}, operands{std::move(operands)} {}
 | |
| 
 | |
|     explicit OperationNode(OperationCode code, std::vector<Node>&& operands)
 | |
|         : code{code}, operands{std::move(operands)} {}
 | |
| 
 | |
|     OperationCode GetCode() const {
 | |
|         return code;
 | |
|     }
 | |
| 
 | |
|     const Meta& GetMeta() const {
 | |
|         return meta;
 | |
|     }
 | |
| 
 | |
|     std::size_t GetOperandsCount() const {
 | |
|         return operands.size();
 | |
|     }
 | |
| 
 | |
|     Node operator[](std::size_t operand_index) const {
 | |
|         return operands.at(operand_index);
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const OperationCode code;
 | |
|     const Meta meta;
 | |
|     std::vector<Node> operands;
 | |
| };
 | |
| 
 | |
| /// Encloses inside any kind of node that returns a boolean conditionally-executed code
 | |
| class ConditionalNode final {
 | |
| public:
 | |
|     explicit ConditionalNode(Node condition, std::vector<Node>&& code)
 | |
|         : condition{condition}, code{std::move(code)} {}
 | |
| 
 | |
|     Node GetCondition() const {
 | |
|         return condition;
 | |
|     }
 | |
| 
 | |
|     const std::vector<Node>& GetCode() const {
 | |
|         return code;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const Node condition;   ///< Condition to be satisfied
 | |
|     std::vector<Node> code; ///< Code to execute
 | |
| };
 | |
| 
 | |
| /// A general purpose register
 | |
| class GprNode final {
 | |
| public:
 | |
|     explicit constexpr GprNode(Tegra::Shader::Register index) : index{index} {}
 | |
| 
 | |
|     u32 GetIndex() const {
 | |
|         return static_cast<u32>(index);
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const Tegra::Shader::Register index;
 | |
| };
 | |
| 
 | |
| /// A 32-bits value that represents an immediate value
 | |
| class ImmediateNode final {
 | |
| public:
 | |
|     explicit constexpr ImmediateNode(u32 value) : value{value} {}
 | |
| 
 | |
|     u32 GetValue() const {
 | |
|         return value;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const u32 value;
 | |
| };
 | |
| 
 | |
| /// One of Maxwell's internal flags
 | |
| class InternalFlagNode final {
 | |
| public:
 | |
|     explicit constexpr InternalFlagNode(InternalFlag flag) : flag{flag} {}
 | |
| 
 | |
|     InternalFlag GetFlag() const {
 | |
|         return flag;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const InternalFlag flag;
 | |
| };
 | |
| 
 | |
| /// A predicate register, it can be negated without additional nodes
 | |
| class PredicateNode final {
 | |
| public:
 | |
|     explicit constexpr PredicateNode(Tegra::Shader::Pred index, bool negated)
 | |
|         : index{index}, negated{negated} {}
 | |
| 
 | |
|     Tegra::Shader::Pred GetIndex() const {
 | |
|         return index;
 | |
|     }
 | |
| 
 | |
|     bool IsNegated() const {
 | |
|         return negated;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const Tegra::Shader::Pred index;
 | |
|     const bool negated;
 | |
| };
 | |
| 
 | |
| /// Attribute buffer memory (known as attributes or varyings in GLSL terms)
 | |
| class AbufNode final {
 | |
| public:
 | |
|     // Initialize for standard attributes (index is explicit).
 | |
|     explicit constexpr AbufNode(Tegra::Shader::Attribute::Index index, u32 element,
 | |
|                                 Node buffer = {})
 | |
|         : buffer{buffer}, index{index}, element{element} {}
 | |
| 
 | |
|     // Initialize for physical attributes (index is a variable value).
 | |
|     explicit constexpr AbufNode(Node physical_address, Node buffer = {})
 | |
|         : physical_address{physical_address}, buffer{buffer} {}
 | |
| 
 | |
|     Tegra::Shader::Attribute::Index GetIndex() const {
 | |
|         return index;
 | |
|     }
 | |
| 
 | |
|     u32 GetElement() const {
 | |
|         return element;
 | |
|     }
 | |
| 
 | |
|     Node GetBuffer() const {
 | |
|         return buffer;
 | |
|     }
 | |
| 
 | |
|     bool IsPhysicalBuffer() const {
 | |
|         return physical_address != nullptr;
 | |
|     }
 | |
| 
 | |
|     Node GetPhysicalAddress() const {
 | |
|         return physical_address;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     Node physical_address{};
 | |
|     Node buffer{};
 | |
|     Tegra::Shader::Attribute::Index index{};
 | |
|     u32 element{};
 | |
| };
 | |
| 
 | |
| /// Constant buffer node, usually mapped to uniform buffers in GLSL
 | |
| class CbufNode final {
 | |
| public:
 | |
|     explicit constexpr CbufNode(u32 index, Node offset) : index{index}, offset{offset} {}
 | |
| 
 | |
|     u32 GetIndex() const {
 | |
|         return index;
 | |
|     }
 | |
| 
 | |
|     Node GetOffset() const {
 | |
|         return offset;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const u32 index;
 | |
|     const Node offset;
 | |
| };
 | |
| 
 | |
| /// Local memory node
 | |
| class LmemNode final {
 | |
| public:
 | |
|     explicit constexpr LmemNode(Node address) : address{address} {}
 | |
| 
 | |
|     Node GetAddress() const {
 | |
|         return address;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const Node address;
 | |
| };
 | |
| 
 | |
| /// Global memory node
 | |
| class GmemNode final {
 | |
| public:
 | |
|     explicit constexpr GmemNode(Node real_address, Node base_address,
 | |
|                                 const GlobalMemoryBase& descriptor)
 | |
|         : real_address{real_address}, base_address{base_address}, descriptor{descriptor} {}
 | |
| 
 | |
|     Node GetRealAddress() const {
 | |
|         return real_address;
 | |
|     }
 | |
| 
 | |
|     Node GetBaseAddress() const {
 | |
|         return base_address;
 | |
|     }
 | |
| 
 | |
|     const GlobalMemoryBase& GetDescriptor() const {
 | |
|         return descriptor;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     const Node real_address;
 | |
|     const Node base_address;
 | |
|     const GlobalMemoryBase descriptor;
 | |
| };
 | |
| 
 | |
| /// Commentary, can be dropped
 | |
| class CommentNode final {
 | |
| public:
 | |
|     explicit CommentNode(std::string text) : text{std::move(text)} {}
 | |
| 
 | |
|     const std::string& GetText() const {
 | |
|         return text;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     std::string text;
 | |
| };
 | |
| 
 | |
| class ShaderIR final {
 | |
| public:
 | |
|     explicit ShaderIR(const ProgramCode& program_code, u32 main_offset);
 | |
|     ~ShaderIR();
 | |
| 
 | |
|     const std::map<u32, NodeBlock>& GetBasicBlocks() const {
 | |
|         return basic_blocks;
 | |
|     }
 | |
| 
 | |
|     const std::set<u32>& GetRegisters() const {
 | |
|         return used_registers;
 | |
|     }
 | |
| 
 | |
|     const std::set<Tegra::Shader::Pred>& GetPredicates() const {
 | |
|         return used_predicates;
 | |
|     }
 | |
| 
 | |
|     const std::set<Tegra::Shader::Attribute::Index>& GetInputAttributes() const {
 | |
|         return used_input_attributes;
 | |
|     }
 | |
| 
 | |
|     const std::set<Tegra::Shader::Attribute::Index>& GetOutputAttributes() const {
 | |
|         return used_output_attributes;
 | |
|     }
 | |
| 
 | |
|     const std::map<u32, ConstBuffer>& GetConstantBuffers() const {
 | |
|         return used_cbufs;
 | |
|     }
 | |
| 
 | |
|     const std::set<Sampler>& GetSamplers() const {
 | |
|         return used_samplers;
 | |
|     }
 | |
| 
 | |
|     const std::array<bool, Tegra::Engines::Maxwell3D::Regs::NumClipDistances>& GetClipDistances()
 | |
|         const {
 | |
|         return used_clip_distances;
 | |
|     }
 | |
| 
 | |
|     const std::map<GlobalMemoryBase, GlobalMemoryUsage>& GetGlobalMemory() const {
 | |
|         return used_global_memory;
 | |
|     }
 | |
| 
 | |
|     std::size_t GetLength() const {
 | |
|         return static_cast<std::size_t>(coverage_end * sizeof(u64));
 | |
|     }
 | |
| 
 | |
|     bool HasPhysicalAttributes() const {
 | |
|         return uses_physical_attributes;
 | |
|     }
 | |
| 
 | |
|     const Tegra::Shader::Header& GetHeader() const {
 | |
|         return header;
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     void Decode();
 | |
| 
 | |
|     ExitMethod Scan(u32 begin, u32 end, std::set<u32>& labels);
 | |
| 
 | |
|     NodeBlock DecodeRange(u32 begin, u32 end);
 | |
| 
 | |
|     /**
 | |
|      * Decodes a single instruction from Tegra to IR.
 | |
|      * @param bb Basic block where the nodes will be written to.
 | |
|      * @param pc Program counter. Offset to decode.
 | |
|      * @return Next address to decode.
 | |
|      */
 | |
|     u32 DecodeInstr(NodeBlock& bb, u32 pc);
 | |
| 
 | |
|     u32 DecodeArithmetic(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeArithmeticImmediate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeBfe(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeBfi(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeShift(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeArithmeticInteger(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeArithmeticIntegerImmediate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeArithmeticHalf(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeArithmeticHalfImmediate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeFfma(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeHfma2(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeConversion(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeMemory(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeTexture(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeFloatSetPredicate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeIntegerSetPredicate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeHalfSetPredicate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodePredicateSetRegister(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodePredicateSetPredicate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeRegisterSetPredicate(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeFloatSet(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeIntegerSet(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeHalfSet(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeVideo(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeXmad(NodeBlock& bb, u32 pc);
 | |
|     u32 DecodeOther(NodeBlock& bb, u32 pc);
 | |
| 
 | |
|     /// Internalizes node's data and returns a managed pointer to a clone of that node
 | |
|     Node StoreNode(NodeData&& node_data);
 | |
| 
 | |
|     /// Creates a conditional node
 | |
|     Node Conditional(Node condition, std::vector<Node>&& code);
 | |
|     /// Creates a commentary
 | |
|     Node Comment(std::string text);
 | |
|     /// Creates an u32 immediate
 | |
|     Node Immediate(u32 value);
 | |
|     /// Creates a s32 immediate
 | |
|     Node Immediate(s32 value) {
 | |
|         return Immediate(static_cast<u32>(value));
 | |
|     }
 | |
|     /// Creates a f32 immediate
 | |
|     Node Immediate(f32 value) {
 | |
|         u32 integral;
 | |
|         std::memcpy(&integral, &value, sizeof(u32));
 | |
|         return Immediate(integral);
 | |
|     }
 | |
| 
 | |
|     /// Generates a node for a passed register.
 | |
|     Node GetRegister(Tegra::Shader::Register reg);
 | |
|     /// Generates a node representing a 19-bit immediate value
 | |
|     Node GetImmediate19(Tegra::Shader::Instruction instr);
 | |
|     /// Generates a node representing a 32-bit immediate value
 | |
|     Node GetImmediate32(Tegra::Shader::Instruction instr);
 | |
|     /// Generates a node representing a constant buffer
 | |
|     Node GetConstBuffer(u64 index, u64 offset);
 | |
|     /// Generates a node representing a constant buffer with a variadic offset
 | |
|     Node GetConstBufferIndirect(u64 index, u64 offset, Node node);
 | |
|     /// Generates a node for a passed predicate. It can be optionally negated
 | |
|     Node GetPredicate(u64 pred, bool negated = false);
 | |
|     /// Generates a predicate node for an immediate true or false value
 | |
|     Node GetPredicate(bool immediate);
 | |
|     /// Generates a node representing an input attribute. Keeps track of used attributes.
 | |
|     Node GetInputAttribute(Tegra::Shader::Attribute::Index index, u64 element, Node buffer = {});
 | |
|     /// Generates a node representing a physical input attribute.
 | |
|     Node GetPhysicalInputAttribute(Tegra::Shader::Register physical_address, Node buffer = {});
 | |
|     /// Generates a node representing an output attribute. Keeps track of used attributes.
 | |
|     Node GetOutputAttribute(Tegra::Shader::Attribute::Index index, u64 element, Node buffer);
 | |
|     /// Generates a node representing an internal flag
 | |
|     Node GetInternalFlag(InternalFlag flag, bool negated = false);
 | |
|     /// Generates a node representing a local memory address
 | |
|     Node GetLocalMemory(Node address);
 | |
|     /// Generates a temporal, internally it uses a post-RZ register
 | |
|     Node GetTemporal(u32 id);
 | |
| 
 | |
|     /// Sets a register. src value must be a number-evaluated node.
 | |
|     void SetRegister(NodeBlock& bb, Tegra::Shader::Register dest, Node src);
 | |
|     /// Sets a predicate. src value must be a bool-evaluated node
 | |
|     void SetPredicate(NodeBlock& bb, u64 dest, Node src);
 | |
|     /// Sets an internal flag. src value must be a bool-evaluated node
 | |
|     void SetInternalFlag(NodeBlock& bb, InternalFlag flag, Node value);
 | |
|     /// Sets a local memory address. address and value must be a number-evaluated node
 | |
|     void SetLocalMemory(NodeBlock& bb, Node address, Node value);
 | |
|     /// Sets a temporal. Internally it uses a post-RZ register
 | |
|     void SetTemporal(NodeBlock& bb, u32 id, Node value);
 | |
| 
 | |
|     /// Sets internal flags from a float
 | |
|     void SetInternalFlagsFromFloat(NodeBlock& bb, Node value, bool sets_cc = true);
 | |
|     /// Sets internal flags from an integer
 | |
|     void SetInternalFlagsFromInteger(NodeBlock& bb, Node value, bool sets_cc = true);
 | |
| 
 | |
|     /// Conditionally absolute/negated float. Absolute is applied first
 | |
|     Node GetOperandAbsNegFloat(Node value, bool absolute, bool negate);
 | |
|     /// Conditionally saturates a float
 | |
|     Node GetSaturatedFloat(Node value, bool saturate = true);
 | |
| 
 | |
|     /// Converts an integer to different sizes.
 | |
|     Node ConvertIntegerSize(Node value, Tegra::Shader::Register::Size size, bool is_signed);
 | |
|     /// Conditionally absolute/negated integer. Absolute is applied first
 | |
|     Node GetOperandAbsNegInteger(Node value, bool absolute, bool negate, bool is_signed);
 | |
| 
 | |
|     /// Unpacks a half immediate from an instruction
 | |
|     Node UnpackHalfImmediate(Tegra::Shader::Instruction instr, bool has_negation);
 | |
|     /// Unpacks a binary value into a half float pair with a type format
 | |
|     Node UnpackHalfFloat(Node value, Tegra::Shader::HalfType type);
 | |
|     /// Merges a half pair into another value
 | |
|     Node HalfMerge(Node dest, Node src, Tegra::Shader::HalfMerge merge);
 | |
|     /// Conditionally absolute/negated half float pair. Absolute is applied first
 | |
|     Node GetOperandAbsNegHalf(Node value, bool absolute, bool negate);
 | |
|     /// Conditionally saturates a half float pair
 | |
|     Node GetSaturatedHalfFloat(Node value, bool saturate = true);
 | |
| 
 | |
|     /// Returns a predicate comparing two floats
 | |
|     Node GetPredicateComparisonFloat(Tegra::Shader::PredCondition condition, Node op_a, Node op_b);
 | |
|     /// Returns a predicate comparing two integers
 | |
|     Node GetPredicateComparisonInteger(Tegra::Shader::PredCondition condition, bool is_signed,
 | |
|                                        Node op_a, Node op_b);
 | |
|     /// Returns a predicate comparing two half floats. meta consumes how both pairs will be compared
 | |
|     Node GetPredicateComparisonHalf(Tegra::Shader::PredCondition condition, Node op_a, Node op_b);
 | |
| 
 | |
|     /// Returns a predicate combiner operation
 | |
|     OperationCode GetPredicateCombiner(Tegra::Shader::PredOperation operation);
 | |
| 
 | |
|     /// Returns a condition code evaluated from internal flags
 | |
|     Node GetConditionCode(Tegra::Shader::ConditionCode cc);
 | |
| 
 | |
|     /// Accesses a texture sampler
 | |
|     const Sampler& GetSampler(const Tegra::Shader::Sampler& sampler,
 | |
|                               Tegra::Shader::TextureType type, bool is_array, bool is_shadow);
 | |
| 
 | |
|     // Accesses a texture sampler for a bindless texture.
 | |
|     const Sampler& GetBindlessSampler(const Tegra::Shader::Register& reg,
 | |
|                                       Tegra::Shader::TextureType type, bool is_array,
 | |
|                                       bool is_shadow);
 | |
| 
 | |
|     /// Extracts a sequence of bits from a node
 | |
|     Node BitfieldExtract(Node value, u32 offset, u32 bits);
 | |
| 
 | |
|     void WriteTexInstructionFloat(NodeBlock& bb, Tegra::Shader::Instruction instr,
 | |
|                                   const Node4& components);
 | |
| 
 | |
|     void WriteTexsInstructionFloat(NodeBlock& bb, Tegra::Shader::Instruction instr,
 | |
|                                    const Node4& components);
 | |
|     void WriteTexsInstructionHalfFloat(NodeBlock& bb, Tegra::Shader::Instruction instr,
 | |
|                                        const Node4& components);
 | |
| 
 | |
|     Node4 GetTexCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type,
 | |
|                      Tegra::Shader::TextureProcessMode process_mode, bool depth_compare,
 | |
|                      bool is_array, bool is_aoffi,
 | |
|                      std::optional<Tegra::Shader::Register> bindless_reg);
 | |
| 
 | |
|     Node4 GetTexsCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type,
 | |
|                       Tegra::Shader::TextureProcessMode process_mode, bool depth_compare,
 | |
|                       bool is_array);
 | |
| 
 | |
|     Node4 GetTld4Code(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type,
 | |
|                       bool depth_compare, bool is_array, bool is_aoffi);
 | |
| 
 | |
|     Node4 GetTldsCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type,
 | |
|                       bool is_array);
 | |
| 
 | |
|     std::tuple<std::size_t, std::size_t> ValidateAndGetCoordinateElement(
 | |
|         Tegra::Shader::TextureType texture_type, bool depth_compare, bool is_array,
 | |
|         bool lod_bias_enabled, std::size_t max_coords, std::size_t max_inputs);
 | |
| 
 | |
|     std::vector<Node> GetAoffiCoordinates(Node aoffi_reg, std::size_t coord_count, bool is_tld4);
 | |
| 
 | |
|     Node4 GetTextureCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type,
 | |
|                          Tegra::Shader::TextureProcessMode process_mode, std::vector<Node> coords,
 | |
|                          Node array, Node depth_compare, u32 bias_offset, std::vector<Node> aoffi,
 | |
|                          std::optional<Tegra::Shader::Register> bindless_reg);
 | |
| 
 | |
|     Node GetVideoOperand(Node op, bool is_chunk, bool is_signed, Tegra::Shader::VideoType type,
 | |
|                          u64 byte_height);
 | |
| 
 | |
|     void WriteLogicOperation(NodeBlock& bb, Tegra::Shader::Register dest,
 | |
|                              Tegra::Shader::LogicOperation logic_op, Node op_a, Node op_b,
 | |
|                              Tegra::Shader::PredicateResultMode predicate_mode,
 | |
|                              Tegra::Shader::Pred predicate, bool sets_cc);
 | |
|     void WriteLop3Instruction(NodeBlock& bb, Tegra::Shader::Register dest, Node op_a, Node op_b,
 | |
|                               Node op_c, Node imm_lut, bool sets_cc);
 | |
| 
 | |
|     Node TrackCbuf(Node tracked, const NodeBlock& code, s64 cursor) const;
 | |
| 
 | |
|     std::optional<u32> TrackImmediate(Node tracked, const NodeBlock& code, s64 cursor) const;
 | |
| 
 | |
|     std::pair<Node, s64> TrackRegister(const GprNode* tracked, const NodeBlock& code,
 | |
|                                        s64 cursor) const;
 | |
| 
 | |
|     std::tuple<Node, Node, GlobalMemoryBase> TrackAndGetGlobalMemory(
 | |
|         NodeBlock& bb, Tegra::Shader::Instruction instr, bool is_write);
 | |
| 
 | |
|     template <typename... T>
 | |
|     Node Operation(OperationCode code, const T*... operands) {
 | |
|         return StoreNode(OperationNode(code, operands...));
 | |
|     }
 | |
| 
 | |
|     template <typename... T>
 | |
|     Node Operation(OperationCode code, Meta&& meta, const T*... operands) {
 | |
|         return StoreNode(OperationNode(code, std::move(meta), operands...));
 | |
|     }
 | |
| 
 | |
|     Node Operation(OperationCode code, std::vector<Node>&& operands) {
 | |
|         return StoreNode(OperationNode(code, std::move(operands)));
 | |
|     }
 | |
| 
 | |
|     Node Operation(OperationCode code, Meta&& meta, std::vector<Node>&& operands) {
 | |
|         return StoreNode(OperationNode(code, std::move(meta), std::move(operands)));
 | |
|     }
 | |
| 
 | |
|     template <typename... T>
 | |
|     Node SignedOperation(OperationCode code, bool is_signed, const T*... operands) {
 | |
|         return StoreNode(OperationNode(SignedToUnsignedCode(code, is_signed), operands...));
 | |
|     }
 | |
| 
 | |
|     template <typename... T>
 | |
|     Node SignedOperation(OperationCode code, bool is_signed, Meta&& meta, const T*... operands) {
 | |
|         return StoreNode(
 | |
|             OperationNode(SignedToUnsignedCode(code, is_signed), std::move(meta), operands...));
 | |
|     }
 | |
| 
 | |
|     static OperationCode SignedToUnsignedCode(OperationCode operation_code, bool is_signed);
 | |
| 
 | |
|     const ProgramCode& program_code;
 | |
|     const u32 main_offset;
 | |
| 
 | |
|     u32 coverage_begin{};
 | |
|     u32 coverage_end{};
 | |
|     std::map<std::pair<u32, u32>, ExitMethod> exit_method_map;
 | |
| 
 | |
|     std::map<u32, NodeBlock> basic_blocks;
 | |
|     NodeBlock global_code;
 | |
| 
 | |
|     std::vector<std::unique_ptr<NodeData>> stored_nodes;
 | |
| 
 | |
|     std::set<u32> used_registers;
 | |
|     std::set<Tegra::Shader::Pred> used_predicates;
 | |
|     std::set<Tegra::Shader::Attribute::Index> used_input_attributes;
 | |
|     std::set<Tegra::Shader::Attribute::Index> used_output_attributes;
 | |
|     std::map<u32, ConstBuffer> used_cbufs;
 | |
|     std::set<Sampler> used_samplers;
 | |
|     std::array<bool, Tegra::Engines::Maxwell3D::Regs::NumClipDistances> used_clip_distances{};
 | |
|     std::map<GlobalMemoryBase, GlobalMemoryUsage> used_global_memory;
 | |
|     bool uses_physical_attributes{}; // Shader uses AL2P or physical attribute read/writes
 | |
| 
 | |
|     Tegra::Shader::Header header;
 | |
| };
 | |
| 
 | |
| } // namespace VideoCommon::Shader
 | 
