// Copyright 2018 yuzu Emulator Project // Licensed under GPLv2 or any later version // Refer to the license.txt file included. #pragma once #include <array> #include <cstring> #include <map> #include <optional> #include <set> #include <string> #include <tuple> #include <variant> #include <vector> #include "common/common_types.h" #include "video_core/engines/maxwell_3d.h" #include "video_core/engines/shader_bytecode.h" #include "video_core/engines/shader_header.h" namespace VideoCommon::Shader { class OperationNode; class ConditionalNode; class GprNode; class ImmediateNode; class InternalFlagNode; class PredicateNode; class AbufNode; ///< Attribute buffer class CbufNode; ///< Constant buffer class LmemNode; ///< Local memory class GmemNode; ///< Global memory class CommentNode; using ProgramCode = std::vector<u64>; using NodeData = std::variant<OperationNode, ConditionalNode, GprNode, ImmediateNode, InternalFlagNode, PredicateNode, AbufNode, CbufNode, LmemNode, GmemNode, CommentNode>; using Node = const NodeData*; using Node4 = std::array<Node, 4>; using NodeBlock = std::vector<Node>; constexpr u32 MAX_PROGRAM_LENGTH = 0x1000; enum class OperationCode { Assign, /// (float& dest, float src) -> void Select, /// (MetaArithmetic, bool pred, float a, float b) -> float FAdd, /// (MetaArithmetic, float a, float b) -> float FMul, /// (MetaArithmetic, float a, float b) -> float FDiv, /// (MetaArithmetic, float a, float b) -> float FFma, /// (MetaArithmetic, float a, float b, float c) -> float FNegate, /// (MetaArithmetic, float a) -> float FAbsolute, /// (MetaArithmetic, float a) -> float FClamp, /// (MetaArithmetic, float value, float min, float max) -> float FMin, /// (MetaArithmetic, float a, float b) -> float FMax, /// (MetaArithmetic, float a, float b) -> float FCos, /// (MetaArithmetic, float a) -> float FSin, /// (MetaArithmetic, float a) -> float FExp2, /// (MetaArithmetic, float a) -> float FLog2, /// (MetaArithmetic, float a) -> float FInverseSqrt, /// (MetaArithmetic, float a) -> float FSqrt, /// (MetaArithmetic, float a) -> float FRoundEven, /// (MetaArithmetic, float a) -> float FFloor, /// (MetaArithmetic, float a) -> float FCeil, /// (MetaArithmetic, float a) -> float FTrunc, /// (MetaArithmetic, float a) -> float FCastInteger, /// (MetaArithmetic, int a) -> float FCastUInteger, /// (MetaArithmetic, uint a) -> float IAdd, /// (MetaArithmetic, int a, int b) -> int IMul, /// (MetaArithmetic, int a, int b) -> int IDiv, /// (MetaArithmetic, int a, int b) -> int INegate, /// (MetaArithmetic, int a) -> int IAbsolute, /// (MetaArithmetic, int a) -> int IMin, /// (MetaArithmetic, int a, int b) -> int IMax, /// (MetaArithmetic, int a, int b) -> int ICastFloat, /// (MetaArithmetic, float a) -> int ICastUnsigned, /// (MetaArithmetic, uint a) -> int ILogicalShiftLeft, /// (MetaArithmetic, int a, uint b) -> int ILogicalShiftRight, /// (MetaArithmetic, int a, uint b) -> int IArithmeticShiftRight, /// (MetaArithmetic, int a, uint b) -> int IBitwiseAnd, /// (MetaArithmetic, int a, int b) -> int IBitwiseOr, /// (MetaArithmetic, int a, int b) -> int IBitwiseXor, /// (MetaArithmetic, int a, int b) -> int IBitwiseNot, /// (MetaArithmetic, int a) -> int IBitfieldInsert, /// (MetaArithmetic, int base, int insert, int offset, int bits) -> int IBitfieldExtract, /// (MetaArithmetic, int value, int offset, int offset) -> int IBitCount, /// (MetaArithmetic, int) -> int UAdd, /// (MetaArithmetic, uint a, uint b) -> uint UMul, /// (MetaArithmetic, uint a, uint b) -> uint UDiv, /// (MetaArithmetic, uint a, uint b) -> uint UMin, /// (MetaArithmetic, uint a, uint b) -> uint UMax, /// (MetaArithmetic, uint a, uint b) -> uint UCastFloat, /// (MetaArithmetic, float a) -> uint UCastSigned, /// (MetaArithmetic, int a) -> uint ULogicalShiftLeft, /// (MetaArithmetic, uint a, uint b) -> uint ULogicalShiftRight, /// (MetaArithmetic, uint a, uint b) -> uint UArithmeticShiftRight, /// (MetaArithmetic, uint a, uint b) -> uint UBitwiseAnd, /// (MetaArithmetic, uint a, uint b) -> uint UBitwiseOr, /// (MetaArithmetic, uint a, uint b) -> uint UBitwiseXor, /// (MetaArithmetic, uint a, uint b) -> uint UBitwiseNot, /// (MetaArithmetic, uint a) -> uint UBitfieldInsert, /// (MetaArithmetic, uint base, uint insert, int offset, int bits) -> uint UBitfieldExtract, /// (MetaArithmetic, uint value, int offset, int offset) -> uint UBitCount, /// (MetaArithmetic, uint) -> uint HAdd, /// (MetaArithmetic, f16vec2 a, f16vec2 b) -> f16vec2 HMul, /// (MetaArithmetic, f16vec2 a, f16vec2 b) -> f16vec2 HFma, /// (MetaArithmetic, f16vec2 a, f16vec2 b, f16vec2 c) -> f16vec2 HAbsolute, /// (f16vec2 a) -> f16vec2 HNegate, /// (f16vec2 a, bool first, bool second) -> f16vec2 HClamp, /// (f16vec2 src, float min, float max) -> f16vec2 HUnpack, /// (Tegra::Shader::HalfType, T value) -> f16vec2 HMergeF32, /// (f16vec2 src) -> float HMergeH0, /// (f16vec2 dest, f16vec2 src) -> f16vec2 HMergeH1, /// (f16vec2 dest, f16vec2 src) -> f16vec2 HPack2, /// (float a, float b) -> f16vec2 LogicalAssign, /// (bool& dst, bool src) -> void LogicalAnd, /// (bool a, bool b) -> bool LogicalOr, /// (bool a, bool b) -> bool LogicalXor, /// (bool a, bool b) -> bool LogicalNegate, /// (bool a) -> bool LogicalPick2, /// (bool2 pair, uint index) -> bool LogicalAll2, /// (bool2 a) -> bool LogicalAny2, /// (bool2 a) -> bool LogicalFLessThan, /// (float a, float b) -> bool LogicalFEqual, /// (float a, float b) -> bool LogicalFLessEqual, /// (float a, float b) -> bool LogicalFGreaterThan, /// (float a, float b) -> bool LogicalFNotEqual, /// (float a, float b) -> bool LogicalFGreaterEqual, /// (float a, float b) -> bool LogicalFIsNan, /// (float a) -> bool LogicalILessThan, /// (int a, int b) -> bool LogicalIEqual, /// (int a, int b) -> bool LogicalILessEqual, /// (int a, int b) -> bool LogicalIGreaterThan, /// (int a, int b) -> bool LogicalINotEqual, /// (int a, int b) -> bool LogicalIGreaterEqual, /// (int a, int b) -> bool LogicalULessThan, /// (uint a, uint b) -> bool LogicalUEqual, /// (uint a, uint b) -> bool LogicalULessEqual, /// (uint a, uint b) -> bool LogicalUGreaterThan, /// (uint a, uint b) -> bool LogicalUNotEqual, /// (uint a, uint b) -> bool LogicalUGreaterEqual, /// (uint a, uint b) -> bool Logical2HLessThan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HEqual, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HLessEqual, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HGreaterThan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HNotEqual, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HGreaterEqual, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HLessThanWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HEqualWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HLessEqualWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HGreaterThanWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HNotEqualWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Logical2HGreaterEqualWithNan, /// (MetaHalfArithmetic, f16vec2 a, f16vec2) -> bool2 Texture, /// (MetaTexture, float[N] coords) -> float4 TextureLod, /// (MetaTexture, float[N] coords) -> float4 TextureGather, /// (MetaTexture, float[N] coords) -> float4 TextureQueryDimensions, /// (MetaTexture, float a) -> float4 TextureQueryLod, /// (MetaTexture, float[N] coords) -> float4 TexelFetch, /// (MetaTexture, int[N], int) -> float4 Branch, /// (uint branch_target) -> void PushFlowStack, /// (uint branch_target) -> void PopFlowStack, /// () -> void Exit, /// () -> void Discard, /// () -> void EmitVertex, /// () -> void EndPrimitive, /// () -> void YNegate, /// () -> float Amount, }; enum class InternalFlag { Zero = 0, Sign = 1, Carry = 2, Overflow = 3, Amount = 4, }; /// Describes the behaviour of code path of a given entry point and a return point. enum class ExitMethod { Undetermined, ///< Internal value. Only occur when analyzing JMP loop. AlwaysReturn, ///< All code paths reach the return point. Conditional, ///< Code path reaches the return point or an END instruction conditionally. AlwaysEnd, ///< All code paths reach a END instruction. }; class Sampler { public: // Use this constructor for bounded Samplers explicit Sampler(std::size_t offset, std::size_t index, Tegra::Shader::TextureType type, bool is_array, bool is_shadow) : offset{offset}, index{index}, type{type}, is_array{is_array}, is_shadow{is_shadow}, is_bindless{false} {} // Use this constructor for bindless Samplers explicit Sampler(u32 cbuf_index, u32 cbuf_offset, std::size_t index, Tegra::Shader::TextureType type, bool is_array, bool is_shadow) : offset{(static_cast<u64>(cbuf_index) << 32) | cbuf_offset}, index{index}, type{type}, is_array{is_array}, is_shadow{is_shadow}, is_bindless{true} {} // Use this only for serialization/deserialization explicit Sampler(std::size_t offset, std::size_t index, Tegra::Shader::TextureType type, bool is_array, bool is_shadow, bool is_bindless) : offset{offset}, index{index}, type{type}, is_array{is_array}, is_shadow{is_shadow}, is_bindless{is_bindless} {} std::size_t GetOffset() const { return offset; } std::size_t GetIndex() const { return index; } Tegra::Shader::TextureType GetType() const { return type; } bool IsArray() const { return is_array; } bool IsShadow() const { return is_shadow; } bool IsBindless() const { return is_bindless; } std::pair<u32, u32> GetBindlessCBuf() const { return {static_cast<u32>(offset >> 32), static_cast<u32>(offset)}; } bool operator<(const Sampler& rhs) const { return std::tie(index, offset, type, is_array, is_shadow, is_bindless) < std::tie(rhs.index, rhs.offset, rhs.type, rhs.is_array, rhs.is_shadow, rhs.is_bindless); } private: /// Offset in TSC memory from which to read the sampler object, as specified by the sampling /// instruction. std::size_t offset{}; std::size_t index{}; ///< Value used to index into the generated GLSL sampler array. Tegra::Shader::TextureType type{}; ///< The type used to sample this texture (Texture2D, etc) bool is_array{}; ///< Whether the texture is being sampled as an array texture or not. bool is_shadow{}; ///< Whether the texture is being sampled as a depth texture or not. bool is_bindless{}; ///< Whether this sampler belongs to a bindless texture or not. }; class ConstBuffer { public: explicit ConstBuffer(u32 max_offset, bool is_indirect) : max_offset{max_offset}, is_indirect{is_indirect} {} ConstBuffer() = default; void MarkAsUsed(u64 offset) { max_offset = std::max(max_offset, static_cast<u32>(offset)); } void MarkAsUsedIndirect() { is_indirect = true; } bool IsIndirect() const { return is_indirect; } u32 GetSize() const { return max_offset + sizeof(float); } u32 GetMaxOffset() const { return max_offset; } private: u32 max_offset{}; bool is_indirect{}; }; struct GlobalMemoryBase { u32 cbuf_index{}; u32 cbuf_offset{}; bool operator<(const GlobalMemoryBase& rhs) const { return std::tie(cbuf_index, cbuf_offset) < std::tie(rhs.cbuf_index, rhs.cbuf_offset); } }; struct GlobalMemoryUsage { bool is_read{}; bool is_written{}; }; struct MetaArithmetic { bool precise{}; }; struct MetaTexture { const Sampler& sampler; Node array{}; Node depth_compare{}; std::vector<Node> aoffi; Node bias{}; Node lod{}; Node component{}; u32 element{}; }; constexpr MetaArithmetic PRECISE = {true}; constexpr MetaArithmetic NO_PRECISE = {false}; using Meta = std::variant<MetaArithmetic, MetaTexture, Tegra::Shader::HalfType>; /// Holds any kind of operation that can be done in the IR class OperationNode final { public: explicit OperationNode(OperationCode code) : code{code} {} explicit OperationNode(OperationCode code, Meta&& meta) : code{code}, meta{std::move(meta)} {} template <typename... T> explicit OperationNode(OperationCode code, const T*... operands) : OperationNode(code, {}, operands...) {} template <typename... T> explicit OperationNode(OperationCode code, Meta&& meta, const T*... operands_) : code{code}, meta{std::move(meta)}, operands{operands_...} {} explicit OperationNode(OperationCode code, Meta&& meta, std::vector<Node>&& operands) : code{code}, meta{meta}, operands{std::move(operands)} {} explicit OperationNode(OperationCode code, std::vector<Node>&& operands) : code{code}, operands{std::move(operands)} {} OperationCode GetCode() const { return code; } const Meta& GetMeta() const { return meta; } std::size_t GetOperandsCount() const { return operands.size(); } Node operator[](std::size_t operand_index) const { return operands.at(operand_index); } private: const OperationCode code; const Meta meta; std::vector<Node> operands; }; /// Encloses inside any kind of node that returns a boolean conditionally-executed code class ConditionalNode final { public: explicit ConditionalNode(Node condition, std::vector<Node>&& code) : condition{condition}, code{std::move(code)} {} Node GetCondition() const { return condition; } const std::vector<Node>& GetCode() const { return code; } private: const Node condition; ///< Condition to be satisfied std::vector<Node> code; ///< Code to execute }; /// A general purpose register class GprNode final { public: explicit constexpr GprNode(Tegra::Shader::Register index) : index{index} {} u32 GetIndex() const { return static_cast<u32>(index); } private: const Tegra::Shader::Register index; }; /// A 32-bits value that represents an immediate value class ImmediateNode final { public: explicit constexpr ImmediateNode(u32 value) : value{value} {} u32 GetValue() const { return value; } private: const u32 value; }; /// One of Maxwell's internal flags class InternalFlagNode final { public: explicit constexpr InternalFlagNode(InternalFlag flag) : flag{flag} {} InternalFlag GetFlag() const { return flag; } private: const InternalFlag flag; }; /// A predicate register, it can be negated without additional nodes class PredicateNode final { public: explicit constexpr PredicateNode(Tegra::Shader::Pred index, bool negated) : index{index}, negated{negated} {} Tegra::Shader::Pred GetIndex() const { return index; } bool IsNegated() const { return negated; } private: const Tegra::Shader::Pred index; const bool negated; }; /// Attribute buffer memory (known as attributes or varyings in GLSL terms) class AbufNode final { public: // Initialize for standard attributes (index is explicit). explicit constexpr AbufNode(Tegra::Shader::Attribute::Index index, u32 element, Node buffer = {}) : buffer{buffer}, index{index}, element{element} {} // Initialize for physical attributes (index is a variable value). explicit constexpr AbufNode(Node physical_address, Node buffer = {}) : physical_address{physical_address}, buffer{buffer} {} Tegra::Shader::Attribute::Index GetIndex() const { return index; } u32 GetElement() const { return element; } Node GetBuffer() const { return buffer; } bool IsPhysicalBuffer() const { return physical_address != nullptr; } Node GetPhysicalAddress() const { return physical_address; } private: Node physical_address{}; Node buffer{}; Tegra::Shader::Attribute::Index index{}; u32 element{}; }; /// Constant buffer node, usually mapped to uniform buffers in GLSL class CbufNode final { public: explicit constexpr CbufNode(u32 index, Node offset) : index{index}, offset{offset} {} u32 GetIndex() const { return index; } Node GetOffset() const { return offset; } private: const u32 index; const Node offset; }; /// Local memory node class LmemNode final { public: explicit constexpr LmemNode(Node address) : address{address} {} Node GetAddress() const { return address; } private: const Node address; }; /// Global memory node class GmemNode final { public: explicit constexpr GmemNode(Node real_address, Node base_address, const GlobalMemoryBase& descriptor) : real_address{real_address}, base_address{base_address}, descriptor{descriptor} {} Node GetRealAddress() const { return real_address; } Node GetBaseAddress() const { return base_address; } const GlobalMemoryBase& GetDescriptor() const { return descriptor; } private: const Node real_address; const Node base_address; const GlobalMemoryBase descriptor; }; /// Commentary, can be dropped class CommentNode final { public: explicit CommentNode(std::string text) : text{std::move(text)} {} const std::string& GetText() const { return text; } private: std::string text; }; class ShaderIR final { public: explicit ShaderIR(const ProgramCode& program_code, u32 main_offset); ~ShaderIR(); const std::map<u32, NodeBlock>& GetBasicBlocks() const { return basic_blocks; } const std::set<u32>& GetRegisters() const { return used_registers; } const std::set<Tegra::Shader::Pred>& GetPredicates() const { return used_predicates; } const std::set<Tegra::Shader::Attribute::Index>& GetInputAttributes() const { return used_input_attributes; } const std::set<Tegra::Shader::Attribute::Index>& GetOutputAttributes() const { return used_output_attributes; } const std::map<u32, ConstBuffer>& GetConstantBuffers() const { return used_cbufs; } const std::set<Sampler>& GetSamplers() const { return used_samplers; } const std::array<bool, Tegra::Engines::Maxwell3D::Regs::NumClipDistances>& GetClipDistances() const { return used_clip_distances; } const std::map<GlobalMemoryBase, GlobalMemoryUsage>& GetGlobalMemory() const { return used_global_memory; } std::size_t GetLength() const { return static_cast<std::size_t>(coverage_end * sizeof(u64)); } bool HasPhysicalAttributes() const { return uses_physical_attributes; } const Tegra::Shader::Header& GetHeader() const { return header; } private: void Decode(); ExitMethod Scan(u32 begin, u32 end, std::set<u32>& labels); NodeBlock DecodeRange(u32 begin, u32 end); /** * Decodes a single instruction from Tegra to IR. * @param bb Basic block where the nodes will be written to. * @param pc Program counter. Offset to decode. * @return Next address to decode. */ u32 DecodeInstr(NodeBlock& bb, u32 pc); u32 DecodeArithmetic(NodeBlock& bb, u32 pc); u32 DecodeArithmeticImmediate(NodeBlock& bb, u32 pc); u32 DecodeBfe(NodeBlock& bb, u32 pc); u32 DecodeBfi(NodeBlock& bb, u32 pc); u32 DecodeShift(NodeBlock& bb, u32 pc); u32 DecodeArithmeticInteger(NodeBlock& bb, u32 pc); u32 DecodeArithmeticIntegerImmediate(NodeBlock& bb, u32 pc); u32 DecodeArithmeticHalf(NodeBlock& bb, u32 pc); u32 DecodeArithmeticHalfImmediate(NodeBlock& bb, u32 pc); u32 DecodeFfma(NodeBlock& bb, u32 pc); u32 DecodeHfma2(NodeBlock& bb, u32 pc); u32 DecodeConversion(NodeBlock& bb, u32 pc); u32 DecodeMemory(NodeBlock& bb, u32 pc); u32 DecodeTexture(NodeBlock& bb, u32 pc); u32 DecodeFloatSetPredicate(NodeBlock& bb, u32 pc); u32 DecodeIntegerSetPredicate(NodeBlock& bb, u32 pc); u32 DecodeHalfSetPredicate(NodeBlock& bb, u32 pc); u32 DecodePredicateSetRegister(NodeBlock& bb, u32 pc); u32 DecodePredicateSetPredicate(NodeBlock& bb, u32 pc); u32 DecodeRegisterSetPredicate(NodeBlock& bb, u32 pc); u32 DecodeFloatSet(NodeBlock& bb, u32 pc); u32 DecodeIntegerSet(NodeBlock& bb, u32 pc); u32 DecodeHalfSet(NodeBlock& bb, u32 pc); u32 DecodeVideo(NodeBlock& bb, u32 pc); u32 DecodeXmad(NodeBlock& bb, u32 pc); u32 DecodeOther(NodeBlock& bb, u32 pc); /// Internalizes node's data and returns a managed pointer to a clone of that node Node StoreNode(NodeData&& node_data); /// Creates a conditional node Node Conditional(Node condition, std::vector<Node>&& code); /// Creates a commentary Node Comment(const std::string& text); /// Creates an u32 immediate Node Immediate(u32 value); /// Creates a s32 immediate Node Immediate(s32 value) { return Immediate(static_cast<u32>(value)); } /// Creates a f32 immediate Node Immediate(f32 value) { u32 integral; std::memcpy(&integral, &value, sizeof(u32)); return Immediate(integral); } /// Generates a node for a passed register. Node GetRegister(Tegra::Shader::Register reg); /// Generates a node representing a 19-bit immediate value Node GetImmediate19(Tegra::Shader::Instruction instr); /// Generates a node representing a 32-bit immediate value Node GetImmediate32(Tegra::Shader::Instruction instr); /// Generates a node representing a constant buffer Node GetConstBuffer(u64 index, u64 offset); /// Generates a node representing a constant buffer with a variadic offset Node GetConstBufferIndirect(u64 index, u64 offset, Node node); /// Generates a node for a passed predicate. It can be optionally negated Node GetPredicate(u64 pred, bool negated = false); /// Generates a predicate node for an immediate true or false value Node GetPredicate(bool immediate); /// Generates a node representing an input attribute. Keeps track of used attributes. Node GetInputAttribute(Tegra::Shader::Attribute::Index index, u64 element, Node buffer = {}); /// Generates a node representing a physical input attribute. Node GetPhysicalInputAttribute(Tegra::Shader::Register physical_address, Node buffer = {}); /// Generates a node representing an output attribute. Keeps track of used attributes. Node GetOutputAttribute(Tegra::Shader::Attribute::Index index, u64 element, Node buffer); /// Generates a node representing an internal flag Node GetInternalFlag(InternalFlag flag, bool negated = false); /// Generates a node representing a local memory address Node GetLocalMemory(Node address); /// Generates a temporal, internally it uses a post-RZ register Node GetTemporal(u32 id); /// Sets a register. src value must be a number-evaluated node. void SetRegister(NodeBlock& bb, Tegra::Shader::Register dest, Node src); /// Sets a predicate. src value must be a bool-evaluated node void SetPredicate(NodeBlock& bb, u64 dest, Node src); /// Sets an internal flag. src value must be a bool-evaluated node void SetInternalFlag(NodeBlock& bb, InternalFlag flag, Node value); /// Sets a local memory address. address and value must be a number-evaluated node void SetLocalMemory(NodeBlock& bb, Node address, Node value); /// Sets a temporal. Internally it uses a post-RZ register void SetTemporal(NodeBlock& bb, u32 id, Node value); /// Sets internal flags from a float void SetInternalFlagsFromFloat(NodeBlock& bb, Node value, bool sets_cc = true); /// Sets internal flags from an integer void SetInternalFlagsFromInteger(NodeBlock& bb, Node value, bool sets_cc = true); /// Conditionally absolute/negated float. Absolute is applied first Node GetOperandAbsNegFloat(Node value, bool absolute, bool negate); /// Conditionally saturates a float Node GetSaturatedFloat(Node value, bool saturate = true); /// Converts an integer to different sizes. Node ConvertIntegerSize(Node value, Tegra::Shader::Register::Size size, bool is_signed); /// Conditionally absolute/negated integer. Absolute is applied first Node GetOperandAbsNegInteger(Node value, bool absolute, bool negate, bool is_signed); /// Unpacks a half immediate from an instruction Node UnpackHalfImmediate(Tegra::Shader::Instruction instr, bool has_negation); /// Unpacks a binary value into a half float pair with a type format Node UnpackHalfFloat(Node value, Tegra::Shader::HalfType type); /// Merges a half pair into another value Node HalfMerge(Node dest, Node src, Tegra::Shader::HalfMerge merge); /// Conditionally absolute/negated half float pair. Absolute is applied first Node GetOperandAbsNegHalf(Node value, bool absolute, bool negate); /// Conditionally saturates a half float pair Node GetSaturatedHalfFloat(Node value, bool saturate = true); /// Returns a predicate comparing two floats Node GetPredicateComparisonFloat(Tegra::Shader::PredCondition condition, Node op_a, Node op_b); /// Returns a predicate comparing two integers Node GetPredicateComparisonInteger(Tegra::Shader::PredCondition condition, bool is_signed, Node op_a, Node op_b); /// Returns a predicate comparing two half floats. meta consumes how both pairs will be compared Node GetPredicateComparisonHalf(Tegra::Shader::PredCondition condition, Node op_a, Node op_b); /// Returns a predicate combiner operation OperationCode GetPredicateCombiner(Tegra::Shader::PredOperation operation); /// Returns a condition code evaluated from internal flags Node GetConditionCode(Tegra::Shader::ConditionCode cc); /// Accesses a texture sampler const Sampler& GetSampler(const Tegra::Shader::Sampler& sampler, Tegra::Shader::TextureType type, bool is_array, bool is_shadow); // Accesses a texture sampler for a bindless texture. const Sampler& GetBindlessSampler(const Tegra::Shader::Register& reg, Tegra::Shader::TextureType type, bool is_array, bool is_shadow); /// Extracts a sequence of bits from a node Node BitfieldExtract(Node value, u32 offset, u32 bits); void WriteTexInstructionFloat(NodeBlock& bb, Tegra::Shader::Instruction instr, const Node4& components); void WriteTexsInstructionFloat(NodeBlock& bb, Tegra::Shader::Instruction instr, const Node4& components); void WriteTexsInstructionHalfFloat(NodeBlock& bb, Tegra::Shader::Instruction instr, const Node4& components); Node4 GetTexCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, Tegra::Shader::TextureProcessMode process_mode, bool depth_compare, bool is_array, bool is_aoffi, std::optional<Tegra::Shader::Register> bindless_reg); Node4 GetTexsCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, Tegra::Shader::TextureProcessMode process_mode, bool depth_compare, bool is_array); Node4 GetTld4Code(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, bool depth_compare, bool is_array, bool is_aoffi); Node4 GetTldsCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, bool is_array); std::tuple<std::size_t, std::size_t> ValidateAndGetCoordinateElement( Tegra::Shader::TextureType texture_type, bool depth_compare, bool is_array, bool lod_bias_enabled, std::size_t max_coords, std::size_t max_inputs); std::vector<Node> GetAoffiCoordinates(Node aoffi_reg, std::size_t coord_count, bool is_tld4); Node4 GetTextureCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, Tegra::Shader::TextureProcessMode process_mode, std::vector<Node> coords, Node array, Node depth_compare, u32 bias_offset, std::vector<Node> aoffi, std::optional<Tegra::Shader::Register> bindless_reg); Node GetVideoOperand(Node op, bool is_chunk, bool is_signed, Tegra::Shader::VideoType type, u64 byte_height); void WriteLogicOperation(NodeBlock& bb, Tegra::Shader::Register dest, Tegra::Shader::LogicOperation logic_op, Node op_a, Node op_b, Tegra::Shader::PredicateResultMode predicate_mode, Tegra::Shader::Pred predicate, bool sets_cc); void WriteLop3Instruction(NodeBlock& bb, Tegra::Shader::Register dest, Node op_a, Node op_b, Node op_c, Node imm_lut, bool sets_cc); Node TrackCbuf(Node tracked, const NodeBlock& code, s64 cursor) const; std::optional<u32> TrackImmediate(Node tracked, const NodeBlock& code, s64 cursor) const; std::pair<Node, s64> TrackRegister(const GprNode* tracked, const NodeBlock& code, s64 cursor) const; std::tuple<Node, Node, GlobalMemoryBase> TrackAndGetGlobalMemory(NodeBlock& bb, Node addr_register, u32 immediate_offset, bool is_write); template <typename... T> Node Operation(OperationCode code, const T*... operands) { return StoreNode(OperationNode(code, operands...)); } template <typename... T> Node Operation(OperationCode code, Meta&& meta, const T*... operands) { return StoreNode(OperationNode(code, std::move(meta), operands...)); } Node Operation(OperationCode code, std::vector<Node>&& operands) { return StoreNode(OperationNode(code, std::move(operands))); } Node Operation(OperationCode code, Meta&& meta, std::vector<Node>&& operands) { return StoreNode(OperationNode(code, std::move(meta), std::move(operands))); } template <typename... T> Node SignedOperation(OperationCode code, bool is_signed, const T*... operands) { return StoreNode(OperationNode(SignedToUnsignedCode(code, is_signed), operands...)); } template <typename... T> Node SignedOperation(OperationCode code, bool is_signed, Meta&& meta, const T*... operands) { return StoreNode( OperationNode(SignedToUnsignedCode(code, is_signed), std::move(meta), operands...)); } static OperationCode SignedToUnsignedCode(OperationCode operation_code, bool is_signed); const ProgramCode& program_code; const u32 main_offset; u32 coverage_begin{}; u32 coverage_end{}; std::map<std::pair<u32, u32>, ExitMethod> exit_method_map; std::map<u32, NodeBlock> basic_blocks; NodeBlock global_code; std::vector<std::unique_ptr<NodeData>> stored_nodes; std::set<u32> used_registers; std::set<Tegra::Shader::Pred> used_predicates; std::set<Tegra::Shader::Attribute::Index> used_input_attributes; std::set<Tegra::Shader::Attribute::Index> used_output_attributes; std::map<u32, ConstBuffer> used_cbufs; std::set<Sampler> used_samplers; std::array<bool, Tegra::Engines::Maxwell3D::Regs::NumClipDistances> used_clip_distances{}; std::map<GlobalMemoryBase, GlobalMemoryUsage> used_global_memory; bool uses_physical_attributes{}; // Shader uses AL2P or physical attribute read/writes Tegra::Shader::Header header; }; } // namespace VideoCommon::Shader