suyu/src/video_core/engines/shader_bytecode.h

// Copyright 2018 yuzu Emulator Project
// Licensed under GPLv2 or any later version
// Refer to the license.txt file included.

#pragma once

#include <bitset>
#include <cstring>
#include <map>
#include <string>
#include <vector>

#include <boost/optional.hpp>

#include "common/bit_field.h"
#include "common/common_types.h"

namespace Tegra {
namespace Shader {

struct Register {
    /// Number of registers
    static constexpr size_t NumRegisters = 256;

    /// Register 255 is special cased to always be 0
    static constexpr size_t ZeroIndex = 255;

    enum class Size : u64 {
        Byte = 0,
        Short = 1,
        Word = 2,
        Long = 3,
    };

    constexpr Register() = default;

    constexpr Register(u64 value) : value(value) {}

    constexpr operator u64() const {
        return value;
    }

    template <typename T>
    constexpr u64 operator-(const T& oth) const {
        return value - oth;
    }

    template <typename T>
    constexpr u64 operator&(const T& oth) const {
        return value & oth;
    }

    constexpr u64 operator&(const Register& oth) const {
        return value & oth.value;
    }

    constexpr u64 operator~() const {
        return ~value;
    }

    u64 GetSwizzledIndex(u64 elem) const {
        elem = (value + elem) & 3;
        return (value & ~3) + elem;
    }

private:
    u64 value{};
};

union Attribute {
    Attribute() = default;

    constexpr explicit Attribute(u64 value) : value(value) {}

    enum class Index : u64 {
        Position = 7,
        Attribute_0 = 8,
        // This attribute contains a tuple of (~, ~, InstanceId, VertexId) when inside a vertex
        // shader, and a tuple of (TessCoord.x, TessCoord.y, TessCoord.z, ~) when inside a Tess Eval
        // shader.
        TessCoordInstanceIDVertexID = 47,
    };

    union {
        BitField<22, 2, u64> element;
        BitField<24, 6, Index> index;
        BitField<47, 3, u64> size;
    } fmt20;

    union {
        BitField<30, 2, u64> element;
        BitField<32, 6, Index> index;
    } fmt28;

    BitField<39, 8, u64> reg;
    u64 value{};
};

union Sampler {
    Sampler() = default;

    constexpr explicit Sampler(u64 value) : value(value) {}

    enum class Index : u64 {
        Sampler_0 = 8,
    };

    BitField<36, 13, Index> index;
    u64 value{};
};

} // namespace Shader
} // namespace Tegra

namespace std {

// TODO(bunnei): The below is forbidden by the C++ standard, but works fine. See #330.
template <>
struct make_unsigned<Tegra::Shader::Attribute> {
    using type = Tegra::Shader::Attribute;
};

template <>
struct make_unsigned<Tegra::Shader::Register> {
    using type = Tegra::Shader::Register;
};

} // namespace std

namespace Tegra {
namespace Shader {

enum class Pred : u64 {
    UnusedIndex = 0x7,
    NeverExecute = 0xF,
};

enum class PredCondition : u64 {
    LessThan = 1,
    Equal = 2,
    LessEqual = 3,
    GreaterThan = 4,
    NotEqual = 5,
    GreaterEqual = 6,
    NotEqualWithNan = 13,
    // TODO(Subv): Other condition types
};

enum class PredOperation : u64 {
    And = 0,
    Or = 1,
    Xor = 2,
};

enum class LogicOperation : u64 {
    And = 0,
    Or = 1,
    Xor = 2,
    PassB = 3,
};

enum class SubOp : u64 {
    Cos = 0x0,
    Sin = 0x1,
    Ex2 = 0x2,
    Lg2 = 0x3,
    Rcp = 0x4,
    Rsq = 0x5,
    Sqrt = 0x8,
};

enum class F2iRoundingOp : u64 {
    None = 0,
    Floor = 1,
    Ceil = 2,
    Trunc = 3,
};

enum class F2fRoundingOp : u64 {
    None = 0,
    Pass = 3,
    Round = 8,
    Floor = 9,
    Ceil = 10,
    Trunc = 11,
};

enum class UniformType : u64 {
    UnsignedByte = 0,
    SignedByte = 1,
    UnsignedShort = 2,
    SignedShort = 3,
    Single = 4,
    Double = 5,
};

union Instruction {
    Instruction& operator=(const Instruction& instr) {
        value = instr.value;
        return *this;
    }

    constexpr Instruction(u64 value) : value{value} {}

    BitField<0, 8, Register> gpr0;
    BitField<8, 8, Register> gpr8;
    union {
        BitField<16, 4, Pred> full_pred;
        BitField<16, 3, u64> pred_index;
    } pred;
    BitField<19, 1, u64> negate_pred;
    BitField<20, 8, Register> gpr20;
    BitField<20, 4, SubOp> sub_op;
    BitField<28, 8, Register> gpr28;
    BitField<39, 8, Register> gpr39;
    BitField<48, 16, u64> opcode;

    union {
        BitField<20, 19, u64> imm20_19;
        BitField<20, 32, s64> imm20_32;
        BitField<45, 1, u64> negate_b;
        BitField<46, 1, u64> abs_a;
        BitField<48, 1, u64> negate_a;
        BitField<49, 1, u64> abs_b;
        BitField<50, 1, u64> saturate_d;
        BitField<56, 1, u64> negate_imm;

        union {
            BitField<39, 3, u64> pred;
            BitField<42, 1, u64> negate_pred;
        } fmnmx;

        union {
            BitField<39, 1, u64> invert_a;
            BitField<40, 1, u64> invert_b;
            BitField<41, 2, LogicOperation> operation;
            BitField<44, 2, u64> unk44;
            BitField<48, 3, Pred> pred48;
        } lop;

        union {
            BitField<53, 2, LogicOperation> operation;
            BitField<55, 1, u64> invert_a;
            BitField<56, 1, u64> invert_b;
        } lop32i;

        float GetImm20_19() const {
            float result{};
            u32 imm{static_cast<u32>(imm20_19)};
            imm <<= 12;
            imm |= negate_imm ? 0x80000000 : 0;
            std::memcpy(&result, &imm, sizeof(imm));
            return result;
        }

        float GetImm20_32() const {
            float result{};
            s32 imm{static_cast<s32>(imm20_32)};
            std::memcpy(&result, &imm, sizeof(imm));
            return result;
        }

        s32 GetSignedImm20_20() const {
            u32 immediate = static_cast<u32>(imm20_19 | (negate_imm << 19));
            // Sign extend the 20-bit value.
            u32 mask = 1U << (20 - 1);
            return static_cast<s32>((immediate ^ mask) - mask);
        }
    } alu;

    union {
        BitField<48, 1, u64> is_signed;
    } shift;

    union {
        BitField<39, 5, u64> shift_amount;
        BitField<48, 1, u64> negate_b;
        BitField<49, 1, u64> negate_a;
    } alu_integer;

    union {
        BitField<54, 1, u64> saturate;
        BitField<56, 1, u64> negate_a;
    } iadd32i;

    union {
        BitField<20, 8, u64> shift_position;
        BitField<28, 8, u64> shift_length;
        BitField<48, 1, u64> negate_b;
        BitField<49, 1, u64> negate_a;

        u64 GetLeftShiftValue() const {
            return 32 - (shift_position + shift_length);
        }
    } bfe;

    union {
        BitField<48, 1, u64> negate_b;
        BitField<49, 1, u64> negate_c;
    } ffma;

    union {
        BitField<48, 3, UniformType> type;
        BitField<44, 2, u64> unknown;
    } ld_c;

    union {
        BitField<0, 3, u64> pred0;
        BitField<3, 3, u64> pred3;
        BitField<7, 1, u64> abs_a;
        BitField<39, 3, u64> pred39;
        BitField<42, 1, u64> neg_pred;
        BitField<43, 1, u64> neg_a;
        BitField<44, 1, u64> abs_b;
        BitField<45, 2, PredOperation> op;
        BitField<47, 1, u64> ftz;
        BitField<48, 4, PredCondition> cond;
        BitField<56, 1, u64> neg_b;
    } fsetp;

    union {
        BitField<0, 3, u64> pred0;
        BitField<3, 3, u64> pred3;
        BitField<39, 3, u64> pred39;
        BitField<42, 1, u64> neg_pred;
        BitField<45, 2, PredOperation> op;
        BitField<48, 1, u64> is_signed;
        BitField<49, 3, PredCondition> cond;
    } isetp;

    union {
        BitField<39, 3, u64> pred39;
        BitField<42, 1, u64> neg_pred;
        BitField<43, 1, u64> neg_a;
        BitField<44, 1, u64> abs_b;
        BitField<45, 2, PredOperation> op;
        BitField<48, 4, PredCondition> cond;
        BitField<52, 1, u64> bf;
        BitField<53, 1, u64> neg_b;
        BitField<54, 1, u64> abs_a;
        BitField<55, 1, u64> ftz;
        BitField<56, 1, u64> neg_imm;
    } fset;

    union {
        BitField<39, 3, u64> pred39;
        BitField<42, 1, u64> neg_pred;
        BitField<44, 1, u64> bf;
        BitField<45, 2, PredOperation> op;
        BitField<48, 1, u64> is_signed;
        BitField<49, 3, PredCondition> cond;
    } iset;

    union {
        BitField<8, 2, Register::Size> dest_size;
        BitField<10, 2, Register::Size> src_size;
        BitField<12, 1, u64> is_output_signed;
        BitField<13, 1, u64> is_input_signed;
        BitField<41, 2, u64> selector;
        BitField<45, 1, u64> negate_a;
        BitField<49, 1, u64> abs_a;

        union {
            BitField<39, 2, F2iRoundingOp> rounding;
        } f2i;

        union {
            BitField<39, 4, F2fRoundingOp> rounding;
        } f2f;
    } conversion;

    union {
        BitField<31, 4, u64> component_mask;

        bool IsComponentEnabled(size_t component) const {
            return ((1ull << component) & component_mask) != 0;
        }
    } tex;

    union {
        BitField<50, 3, u64> component_mask_selector;
        BitField<28, 8, Register> gpr28;

        bool HasTwoDestinations() const {
            return gpr28.Value() != Register::ZeroIndex;
        }

        bool IsComponentEnabled(size_t component) const {
            static constexpr std::array<size_t, 5> one_dest_mask{0x1, 0x2, 0x4, 0x8, 0x3};
            static constexpr std::array<size_t, 5> two_dest_mask{0x7, 0xb, 0xd, 0xe, 0xf};
            const auto& mask{HasTwoDestinations() ? two_dest_mask : one_dest_mask};

            ASSERT(component_mask_selector < mask.size());

            return ((1ull << component) & mask[component_mask_selector]) != 0;
        }
    } texs;

    union {
        BitField<20, 24, u64> target;
        BitField<5, 1, u64> constant_buffer;

        s32 GetBranchTarget() const {
            // Sign extend the branch target offset
            u32 mask = 1U << (24 - 1);
            u32 value = static_cast<u32>(target);
            // The branch offset is relative to the next instruction and is stored in bytes, so
            // divide it by the size of an instruction and add 1 to it.
            return static_cast<s32>((value ^ mask) - mask) / sizeof(Instruction) + 1;
        }
    } bra;

    union {
        BitField<20, 14, u64> offset;
        BitField<34, 5, u64> index;
    } cbuf34;

    union {
        BitField<20, 16, s64> offset;
        BitField<36, 5, u64> index;
    } cbuf36;

    BitField<61, 1, u64> is_b_imm;
    BitField<60, 1, u64> is_b_gpr;
    BitField<59, 1, u64> is_c_gpr;

    Attribute attribute;
    Sampler sampler;

    u64 value;
};
static_assert(sizeof(Instruction) == 0x8, "Incorrect structure size");
static_assert(std::is_standard_layout<Instruction>::value,
              "Structure does not have standard layout");

class OpCode {
public:
    enum class Id {
        KIL,
        SSY,
        BFE_C,
        BFE_R,
        BFE_IMM,
        BRA,
        LD_A,
        LD_C,
        ST_A,
        TEX,
        TEXQ, // Texture Query
        TEXS, // Texture Fetch with scalar/non-vec4 source/destinations
        TLDS, // Texture Load with scalar/non-vec4 source/destinations
        EXIT,
        IPA,
        FFMA_IMM, // Fused Multiply and Add
        FFMA_CR,
        FFMA_RC,
        FFMA_RR,
        FADD_C,
        FADD_R,
        FADD_IMM,
        FMUL_C,
        FMUL_R,
        FMUL_IMM,
        FMUL32_IMM,
        IADD_C,
        IADD_R,
        IADD_IMM,
        IADD32I,
        ISCADD_C, // Scale and Add
        ISCADD_R,
        ISCADD_IMM,
        MUFU,  // Multi-Function Operator
        RRO_C, // Range Reduction Operator
        RRO_R,
        RRO_IMM,
        F2F_C,
        F2F_R,
        F2F_IMM,
        F2I_C,
        F2I_R,
        F2I_IMM,
        I2F_C,
        I2F_R,
        I2F_IMM,
        I2I_C,
        I2I_R,
        I2I_IMM,
        LOP_C,
        LOP_R,
        LOP_IMM,
        LOP32I,
        MOV_C,
        MOV_R,
        MOV_IMM,
        MOV32_IMM,
        SHL_C,
        SHL_R,
        SHL_IMM,
        SHR_C,
        SHR_R,
        SHR_IMM,
        FMNMX_C,
        FMNMX_R,
        FMNMX_IMM,
        IMNMX_C,
        IMNMX_R,
        IMNMX_IMM,
        FSETP_C, // Set Predicate
        FSETP_R,
        FSETP_IMM,
        FSET_C,
        FSET_R,
        FSET_IMM,
        ISETP_C,
        ISETP_IMM,
        ISETP_R,
        ISET_R,
        ISET_C,
        ISET_IMM,
        PSETP,
        XMAD_IMM,
        XMAD_CR,
        XMAD_RC,
        XMAD_RR,
    };

    enum class Type {
        Trivial,
        Arithmetic,
        ArithmeticImmediate,
        ArithmeticInteger,
        ArithmeticIntegerImmediate,
        Bfe,
        Shift,
        Ffma,
        Flow,
        Memory,
        FloatSet,
        FloatSetPredicate,
        IntegerSet,
        IntegerSetPredicate,
        PredicateSetPredicate,
        Conversion,
        Unknown,
    };

    class Matcher {
    public:
        Matcher(const char* const name, u16 mask, u16 expected, OpCode::Id id, OpCode::Type type)
            : name{name}, mask{mask}, expected{expected}, id{id}, type{type} {}

        const char* GetName() const {
            return name;
        }

        u16 GetMask() const {
            return mask;
        }

        Id GetId() const {
            return id;
        }

        Type GetType() const {
            return type;
        }

        /**
         * Tests to see if the given instruction is the instruction this matcher represents.
         * @param instruction The instruction to test
         * @returns true if the given instruction matches.
         */
        bool Matches(u16 instruction) const {
            return (instruction & mask) == expected;
        }

    private:
        const char* name;
        u16 mask;
        u16 expected;
        Id id;
        Type type;
    };

    static boost::optional<const Matcher&> Decode(Instruction instr) {
        static const auto table{GetDecodeTable()};

        const auto matches_instruction = [instr](const auto& matcher) {
            return matcher.Matches(static_cast<u16>(instr.opcode));
        };

        auto iter = std::find_if(table.begin(), table.end(), matches_instruction);
        return iter != table.end() ? boost::optional<const Matcher&>(*iter) : boost::none;
    }

private:
    struct Detail {
    private:
        static constexpr size_t opcode_bitsize = 16;

        /**
         * Generates the mask and the expected value after masking from a given bitstring.
         * A '0' in a bitstring indicates that a zero must be present at that bit position.
         * A '1' in a bitstring indicates that a one must be present at that bit position.
         */
        static auto GetMaskAndExpect(const char* const bitstring) {
            u16 mask = 0, expect = 0;
            for (size_t i = 0; i < opcode_bitsize; i++) {
                const size_t bit_position = opcode_bitsize - i - 1;
                switch (bitstring[i]) {
                case '0':
                    mask |= 1 << bit_position;
                    break;
                case '1':
                    expect |= 1 << bit_position;
                    mask |= 1 << bit_position;
                    break;
                default:
                    // Ignore
                    break;
                }
            }
            return std::make_tuple(mask, expect);
        }

    public:
        /// Creates a matcher that can match and parse instructions based on bitstring.
        static auto GetMatcher(const char* const bitstring, OpCode::Id op, OpCode::Type type,
                               const char* const name) {
            const auto mask_expect = GetMaskAndExpect(bitstring);
            return Matcher(name, std::get<0>(mask_expect), std::get<1>(mask_expect), op, type);
        }
    };

    static std::vector<Matcher> GetDecodeTable() {
        std::vector<Matcher> table = {
#define INST(bitstring, op, type, name) Detail::GetMatcher(bitstring, op, type, name)
            INST("111000110011----", Id::KIL, Type::Flow, "KIL"),
            INST("111000101001----", Id::SSY, Type::Flow, "SSY"),
            INST("111000100100----", Id::BRA, Type::Flow, "BRA"),
            INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"),
            INST("1110111110010---", Id::LD_C, Type::Memory, "LD_C"),
            INST("1110111111110---", Id::ST_A, Type::Memory, "ST_A"),
            INST("1100000000111---", Id::TEX, Type::Memory, "TEX"),
            INST("1101111101001---", Id::TEXQ, Type::Memory, "TEXQ"),
            INST("1101100---------", Id::TEXS, Type::Memory, "TEXS"),
            INST("1101101---------", Id::TLDS, Type::Memory, "TLDS"),
            INST("111000110000----", Id::EXIT, Type::Trivial, "EXIT"),
            INST("11100000--------", Id::IPA, Type::Trivial, "IPA"),
            INST("001100101-------", Id::FFMA_IMM, Type::Ffma, "FFMA_IMM"),
            INST("010010011-------", Id::FFMA_CR, Type::Ffma, "FFMA_CR"),
            INST("010100011-------", Id::FFMA_RC, Type::Ffma, "FFMA_RC"),
            INST("010110011-------", Id::FFMA_RR, Type::Ffma, "FFMA_RR"),
            INST("0100110001011---", Id::FADD_C, Type::Arithmetic, "FADD_C"),
            INST("0101110001011---", Id::FADD_R, Type::Arithmetic, "FADD_R"),
            INST("0011100-01011---", Id::FADD_IMM, Type::Arithmetic, "FADD_IMM"),
            INST("0100110001101---", Id::FMUL_C, Type::Arithmetic, "FMUL_C"),
            INST("0101110001101---", Id::FMUL_R, Type::Arithmetic, "FMUL_R"),
            INST("0011100-01101---", Id::FMUL_IMM, Type::Arithmetic, "FMUL_IMM"),
            INST("00011110--------", Id::FMUL32_IMM, Type::ArithmeticImmediate, "FMUL32_IMM"),
            INST("0100110000010---", Id::IADD_C, Type::ArithmeticInteger, "IADD_C"),
            INST("0101110000010---", Id::IADD_R, Type::ArithmeticInteger, "IADD_R"),
            INST("0011100-00010---", Id::IADD_IMM, Type::ArithmeticInteger, "IADD_IMM"),
            INST("0001110---------", Id::IADD32I, Type::ArithmeticIntegerImmediate, "IADD32I"),
            INST("0100110000011---", Id::ISCADD_C, Type::ArithmeticInteger, "ISCADD_C"),
            INST("0101110000011---", Id::ISCADD_R, Type::ArithmeticInteger, "ISCADD_R"),
            INST("0011100-00011---", Id::ISCADD_IMM, Type::ArithmeticInteger, "ISCADD_IMM"),
            INST("0101000010000---", Id::MUFU, Type::Arithmetic, "MUFU"),
            INST("0100110010010---", Id::RRO_C, Type::Arithmetic, "RRO_C"),
            INST("0101110010010---", Id::RRO_R, Type::Arithmetic, "RRO_R"),
            INST("0011100-10010---", Id::RRO_IMM, Type::Arithmetic, "RRO_IMM"),
            INST("0100110010101---", Id::F2F_C, Type::Conversion, "F2F_C"),
            INST("0101110010101---", Id::F2F_R, Type::Conversion, "F2F_R"),
            INST("0011100-10101---", Id::F2F_IMM, Type::Conversion, "F2F_IMM"),
            INST("0100110010110---", Id::F2I_C, Type::Conversion, "F2I_C"),
            INST("0101110010110---", Id::F2I_R, Type::Conversion, "F2I_R"),
            INST("0011100-10110---", Id::F2I_IMM, Type::Conversion, "F2I_IMM"),
            INST("0100110010011---", Id::MOV_C, Type::Arithmetic, "MOV_C"),
            INST("0101110010011---", Id::MOV_R, Type::Arithmetic, "MOV_R"),
            INST("0011100-10011---", Id::MOV_IMM, Type::Arithmetic, "MOV_IMM"),
            INST("000000010000----", Id::MOV32_IMM, Type::ArithmeticImmediate, "MOV32_IMM"),
            INST("0100110001100---", Id::FMNMX_C, Type::Arithmetic, "FMNMX_C"),
            INST("0101110001100---", Id::FMNMX_R, Type::Arithmetic, "FMNMX_R"),
            INST("0011100-01100---", Id::FMNMX_IMM, Type::Arithmetic, "FMNMX_IMM"),
            INST("0100110000100---", Id::IMNMX_C, Type::Arithmetic, "FMNMX_IMM"),
            INST("0101110000100---", Id::IMNMX_R, Type::Arithmetic, "FMNMX_IMM"),
            INST("0011100-00100---", Id::IMNMX_IMM, Type::Arithmetic, "FMNMX_IMM"),
            INST("0100110000000---", Id::BFE_C, Type::Bfe, "BFE_C"),
            INST("0101110000000---", Id::BFE_R, Type::Bfe, "BFE_R"),
            INST("0011100-00000---", Id::BFE_IMM, Type::Bfe, "BFE_IMM"),
            INST("0100110001000---", Id::LOP_C, Type::ArithmeticInteger, "LOP_C"),
            INST("0101110001000---", Id::LOP_R, Type::ArithmeticInteger, "LOP_R"),
            INST("0011100001000---", Id::LOP_IMM, Type::ArithmeticInteger, "LOP_IMM"),
            INST("000001----------", Id::LOP32I, Type::ArithmeticIntegerImmediate, "LOP32I"),
            INST("0100110001001---", Id::SHL_C, Type::Shift, "SHL_C"),
            INST("0101110001001---", Id::SHL_R, Type::Shift, "SHL_R"),
            INST("0011100-01001---", Id::SHL_IMM, Type::Shift, "SHL_IMM"),
            INST("0100110000101---", Id::SHR_C, Type::Shift, "SHR_C"),
            INST("0101110000101---", Id::SHR_R, Type::Shift, "SHR_R"),
            INST("0011100-00101---", Id::SHR_IMM, Type::Shift, "SHR_IMM"),
            INST("0100110011100---", Id::I2I_C, Type::Conversion, "I2I_C"),
            INST("0101110011100---", Id::I2I_R, Type::Conversion, "I2I_R"),
            INST("01110001-1000---", Id::I2I_IMM, Type::Conversion, "I2I_IMM"),
            INST("0100110010111---", Id::I2F_C, Type::Conversion, "I2F_C"),
            INST("0101110010111---", Id::I2F_R, Type::Conversion, "I2F_R"),
            INST("0011100-10111---", Id::I2F_IMM, Type::Conversion, "I2F_IMM"),
            INST("01011000--------", Id::FSET_R, Type::FloatSet, "FSET_R"),
            INST("0100100---------", Id::FSET_C, Type::FloatSet, "FSET_C"),
            INST("0011000---------", Id::FSET_IMM, Type::FloatSet, "FSET_IMM"),
            INST("010010111011----", Id::FSETP_C, Type::FloatSetPredicate, "FSETP_C"),
            INST("010110111011----", Id::FSETP_R, Type::FloatSetPredicate, "FSETP_R"),
            INST("0011011-1011----", Id::FSETP_IMM, Type::FloatSetPredicate, "FSETP_IMM"),
            INST("010010110110----", Id::ISETP_C, Type::IntegerSetPredicate, "ISETP_C"),
            INST("010110110110----", Id::ISETP_R, Type::IntegerSetPredicate, "ISETP_R"),
            INST("0011011-0110----", Id::ISETP_IMM, Type::IntegerSetPredicate, "ISETP_IMM"),
            INST("010110110101----", Id::ISET_R, Type::IntegerSet, "ISET_R"),
            INST("010010110101----", Id::ISET_C, Type::IntegerSet, "ISET_C"),
            INST("0011011-0101----", Id::ISET_IMM, Type::IntegerSet, "ISET_IMM"),
            INST("0101000010010---", Id::PSETP, Type::PredicateSetPredicate, "PSETP"),
            INST("0011011-00------", Id::XMAD_IMM, Type::Arithmetic, "XMAD_IMM"),
            INST("0100111---------", Id::XMAD_CR, Type::Arithmetic, "XMAD_CR"),
            INST("010100010-------", Id::XMAD_RC, Type::Arithmetic, "XMAD_RC"),
            INST("0101101100------", Id::XMAD_RR, Type::Arithmetic, "XMAD_RR"),
        };
#undef INST
        std::stable_sort(table.begin(), table.end(), [](const auto& a, const auto& b) {
            // If a matcher has more bits in its mask it is more specific, so it
            // should come first.
            return std::bitset<16>(a.GetMask()).count() > std::bitset<16>(b.GetMask()).count();
        });

        return table;
    }
};

} // namespace Shader
} // namespace Tegra
-												shader_bytecode: Implement other variants of FMNMX.

											
										
										
											2018-05-24 23:37:18 +00:00
+								// Copyright 2018 yuzu Emulator Project
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								// Licensed under GPLv2 or any later version
 								// Refer to the license.txt file included.
 								#pragma once
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								#include <bitset>
-												gl_shader_decompiler: Implement FMUL/FADD/FFMA immediate instructions.

											
										
										
											2018-04-16 00:45:56 +00:00
+								#include <cstring>
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								#include <map>
 								#include <string>
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								#include <vector>
 								#include <boost/optional.hpp>
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								#include "common/bit_field.h"
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								#include "common/common_types.h"
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
 								namespace Tegra {
 								namespace Shader {
 								struct Register {
-												gl_shader_decompiler: Boilerplate for handling integer instructions.

											
										
										
											2018-04-26 03:55:21 +00:00
+								    /// Number of registers
 								    static constexpr size_t NumRegisters = 256;
 								    /// Register 255 is special cased to always be 0
-												ShaderGen: Register id 255 is special and is hardcoded to return 0 (SR_ZERO).

											
										
										
											2018-04-20 14:04:54 +00:00
+								    static constexpr size_t ZeroIndex = 255;
-												shader_bytecode: Add decodings for i2i instructions.

											
										
										
											2018-04-28 02:19:14 +00:00
+								    enum class Size : u64 {
 								        Byte = 0,
 								        Short = 1,
 								        Word = 2,
 								        Long = 3,
 								    };
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    constexpr Register() = default;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
 								    constexpr Register(u64 value) : value(value) {}
 								    constexpr operator u64() const {
 								        return value;
 								    }
 								    template <typename T>
 								    constexpr u64 operator-(const T& oth) const {
 								        return value - oth;
 								    }
 								    template <typename T>
 								    constexpr u64 operator&(const T& oth) const {
 								        return value & oth;
 								    }
 								    constexpr u64 operator&(const Register& oth) const {
 								        return value & oth.value;
 								    }
 								    constexpr u64 operator~() const {
 								        return ~value;
 								    }
-												gl_shader_decompiler: Boilerplate for handling integer instructions.

											
										
										
											2018-04-26 03:55:21 +00:00
+								    u64 GetSwizzledIndex(u64 elem) const {
 								        elem = (value + elem) & 3;
 								        return (value & ~3) + elem;
 								    }
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								private:
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    u64 value{};
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								};
 								union Attribute {
-												shaders: Fix GCC and clang build issues.

											
										
										
											2018-04-14 18:09:32 +00:00
+								    Attribute() = default;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    constexpr explicit Attribute(u64 value) : value(value) {}
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
 								    enum class Index : u64 {
 								        Position = 7,
 								        Attribute_0 = 8,
-												Shaders: Implemented reading the gl_InstanceID and gl_VertexID variables in the vertex shader.

											
										
										
											2018-05-30 15:58:03 +00:00
+								        // This attribute contains a tuple of (~, ~, InstanceId, VertexId) when inside a vertex
 								        // shader, and a tuple of (TessCoord.x, TessCoord.y, TessCoord.z, ~) when inside a Tess Eval
 								        // shader.
 								        TessCoordInstanceIDVertexID = 47,
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								    };
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    union {
 								        BitField<22, 2, u64> element;
 								        BitField<24, 6, Index> index;
 								        BitField<47, 3, u64> size;
 								    } fmt20;
 								    union {
 								        BitField<30, 2, u64> element;
 								        BitField<32, 6, Index> index;
 								    } fmt28;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
 								    BitField<39, 8, u64> reg;
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    u64 value{};
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								};
-												gl_shader_decompiler: Add support for TEXS instruction.

											
										
										
											2018-04-10 05:26:15 +00:00
+								union Sampler {
 								    Sampler() = default;
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    constexpr explicit Sampler(u64 value) : value(value) {}
-												gl_shader_decompiler: Add support for TEXS instruction.

											
										
										
											2018-04-10 05:26:15 +00:00
 								    enum class Index : u64 {
 								        Sampler_0 = 8,
 								    };
 								    BitField<36, 13, Index> index;
-												shader_bytecode: Make ctor's constexpr and explicit.

											
										
										
											2018-04-17 22:06:10 +00:00
+								    u64 value{};
-												gl_shader_decompiler: Add support for TEXS instruction.

											
										
										
											2018-04-10 05:26:15 +00:00
+								};
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								} // namespace Shader
 								} // namespace Tegra
 								namespace std {
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								// TODO(bunnei): The below is forbidden by the C++ standard, but works fine. See #330.
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								template <>
 								struct make_unsigned<Tegra::Shader::Attribute> {
 								    using type = Tegra::Shader::Attribute;
 								};
 								template <>
 								struct make_unsigned<Tegra::Shader::Register> {
 								    using type = Tegra::Shader::Register;
 								};
 								} // namespace std
 								namespace Tegra {
 								namespace Shader {
 								enum class Pred : u64 {
 								    UnusedIndex = 0x7,
-												ShaderGen: Implemented the fsetp instruction.

Predicate variables are now added to the generated shader code in the form of 'pX' where X is the predicate id.
These predicate variables are initialized to false on shader startup and are set via the fsetp instructions.

TODO:

* Not all the comparison types are implemented.
* Only the single-predicate version is implemented.

											
										
										
											2018-04-20 14:09:50 +00:00
+								    NeverExecute = 0xF,
 								};
 								enum class PredCondition : u64 {
 								    LessThan = 1,
 								    Equal = 2,
 								    LessEqual = 3,
 								    GreaterThan = 4,
 								    NotEqual = 5,
 								    GreaterEqual = 6,
-												gl_shader_decompiler: Implement predicate NotEqualWithNan.

											
										
										
											2018-06-30 07:00:39 +00:00
+								    NotEqualWithNan = 13,
-												ShaderGen: Implemented the fsetp instruction.

Predicate variables are now added to the generated shader code in the form of 'pX' where X is the predicate id.
These predicate variables are initialized to false on shader startup and are set via the fsetp instructions.

TODO:

* Not all the comparison types are implemented.
* Only the single-predicate version is implemented.

											
										
										
											2018-04-20 14:09:50 +00:00
+								    // TODO(Subv): Other condition types
 								};
 								enum class PredOperation : u64 {
 								    And = 0,
 								    Or = 1,
 								    Xor = 2,
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								};
-												GPU: Implemented the LOP32I instruction.

											
										
										
											2018-06-04 18:24:31 +00:00
+								enum class LogicOperation : u64 {
 								    And = 0,
 								    Or = 1,
 								    Xor = 2,
 								    PassB = 3,
 								};
-												shader_bytecode: Add SubOp decoding.

											
										
										
											2018-04-10 02:09:23 +00:00
+								enum class SubOp : u64 {
 								    Cos = 0x0,
 								    Sin = 0x1,
 								    Ex2 = 0x2,
 								    Lg2 = 0x3,
 								    Rcp = 0x4,
 								    Rsq = 0x5,
-												GPU: Implemented MUFU suboperation 8, sqrt.

											
										
										
											2018-07-03 00:48:15 +00:00
+								    Sqrt = 0x8,
-												shader_bytecode: Add SubOp decoding.

											
										
										
											2018-04-10 02:09:23 +00:00
+								};
-												gl_shader_decompiler: F2F: Implement rounding modes.

											
										
										
											2018-06-07 02:21:29 +00:00
+								enum class F2iRoundingOp : u64 {
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
+								    None = 0,
 								    Floor = 1,
 								    Ceil = 2,
 								    Trunc = 3,
 								};
-												gl_shader_decompiler: F2F: Implement rounding modes.

											
										
										
											2018-06-07 02:21:29 +00:00
+								enum class F2fRoundingOp : u64 {
 								    None = 0,
 								    Pass = 3,
 								    Round = 8,
 								    Floor = 9,
 								    Ceil = 10,
 								    Trunc = 11,
 								};
-												gl_shader_decompiler: Implement LD_C instruction.

											
										
										
											2018-06-06 03:46:23 +00:00
+								enum class UniformType : u64 {
 								    UnsignedByte = 0,
 								    SignedByte = 1,
 								    UnsignedShort = 2,
 								    SignedShort = 3,
 								    Single = 4,
 								    Double = 5,
 								};
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								union Instruction {
 								    Instruction& operator=(const Instruction& instr) {
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        value = instr.value;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								        return *this;
 								    }
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								    constexpr Instruction(u64 value) : value{value} {}
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    BitField<0, 8, Register> gpr0;
 								    BitField<8, 8, Register> gpr8;
-												ShaderGen: Implemented predicated instruction execution.

Each predicated instruction will be wrapped in an `if (predicate) { instruction_body; }` in the GLSL, where `predicate` is one of the predicate boolean variables previously set by fsetp.

											
										
										
											2018-04-20 14:16:55 +00:00
+								    union {
 								        BitField<16, 4, Pred> full_pred;
 								        BitField<16, 3, u64> pred_index;
 								    } pred;
 								    BitField<19, 1, u64> negate_pred;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    BitField<20, 8, Register> gpr20;
-												GPU: Corrected the size of the MUFU subop field, and removed incorrect "min" operation.

											
										
										
											2018-06-30 19:48:25 +00:00
+								    BitField<20, 4, SubOp> sub_op;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    BitField<28, 8, Register> gpr28;
 								    BitField<39, 8, Register> gpr39;
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								    BitField<48, 16, u64> opcode;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
 								    union {
-												ShaderGen: Implemented the fmul32i shader instruction.

											
										
										
											2018-04-19 18:34:50 +00:00
+								        BitField<20, 19, u64> imm20_19;
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								        BitField<20, 32, s64> imm20_32;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								        BitField<45, 1, u64> negate_b;
 								        BitField<46, 1, u64> abs_a;
 								        BitField<48, 1, u64> negate_a;
 								        BitField<49, 1, u64> abs_b;
-												gl_shader_decompiler: Implement saturate for float instructions.

											
										
										
											2018-06-09 06:36:33 +00:00
+								        BitField<50, 1, u64> saturate_d;
-												gl_shader_decompiler: Implement FMUL/FADD/FFMA immediate instructions.

											
										
										
											2018-04-16 00:45:56 +00:00
+								        BitField<56, 1, u64> negate_imm;
-												Shaders: Implemented the FMNMX shader instruction.

											
										
										
											2018-05-20 22:53:06 +00:00
+								        union {
 								            BitField<39, 3, u64> pred;
 								            BitField<42, 1, u64> negate_pred;
 								        } fmnmx;
-												gl_shader_decompiler: Implement LOP instructions.

											
										
										
											2018-06-17 17:26:11 +00:00
+								        union {
 								            BitField<39, 1, u64> invert_a;
 								            BitField<40, 1, u64> invert_b;
 								            BitField<41, 2, LogicOperation> operation;
 								            BitField<44, 2, u64> unk44;
 								            BitField<48, 3, Pred> pred48;
 								        } lop;
-												GPU: Implemented the LOP32I instruction.

											
										
										
											2018-06-04 18:24:31 +00:00
+								        union {
 								            BitField<53, 2, LogicOperation> operation;
 								            BitField<55, 1, u64> invert_a;
 								            BitField<56, 1, u64> invert_b;
-												gl_shader_decompiler: Refactor LOP32I instruction a bit in support of LOP.

											
										
										
											2018-06-17 16:49:34 +00:00
+								        } lop32i;
-												GPU: Implemented the LOP32I instruction.

											
										
										
											2018-06-04 18:24:31 +00:00
-												ShaderGen: Implemented the fmul32i shader instruction.

											
										
										
											2018-04-19 18:34:50 +00:00
+								        float GetImm20_19() const {
-												gl_shader_decompiler: Implement FMUL/FADD/FFMA immediate instructions.

											
										
										
											2018-04-16 00:45:56 +00:00
+								            float result{};
-												ShaderGen: Implemented the fmul32i shader instruction.

											
										
										
											2018-04-19 18:34:50 +00:00
+								            u32 imm{static_cast<u32>(imm20_19)};
-												gl_shader_decompiler: Implement FMUL/FADD/FFMA immediate instructions.

											
										
										
											2018-04-16 00:45:56 +00:00
+								            imm <<= 12;
 								            imm |= negate_imm ? 0x80000000 : 0;
 								            std::memcpy(&result, &imm, sizeof(imm));
 								            return result;
 								        }
-												ShaderGen: Implemented the fmul32i shader instruction.

											
										
										
											2018-04-19 18:34:50 +00:00
 								        float GetImm20_32() const {
 								            float result{};
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								            s32 imm{static_cast<s32>(imm20_32)};
-												ShaderGen: Implemented the fmul32i shader instruction.

											
										
										
											2018-04-19 18:34:50 +00:00
+								            std::memcpy(&result, &imm, sizeof(imm));
 								            return result;
 								        }
-												GPU: Implement the ISCADD shader instructions.

											
										
										
											2018-06-05 00:03:47 +00:00
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								        s32 GetSignedImm20_20() const {
 								            u32 immediate = static_cast<u32>(imm20_19 | (negate_imm << 19));
-												GPU: Implement the ISCADD shader instructions.

											
										
										
											2018-06-05 00:03:47 +00:00
+								            // Sign extend the 20-bit value.
 								            u32 mask = 1U << (20 - 1);
 								            return static_cast<s32>((immediate ^ mask) - mask);
 								        }
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								    } alu;
-												GPU: Implement the ISCADD shader instructions.

											
										
										
											2018-06-05 00:03:47 +00:00
-												gl_shader_decompiler: Implement SHR instruction.

											
										
										
											2018-06-09 04:01:17 +00:00
+								    union {
 								        BitField<48, 1, u64> is_signed;
 								    } shift;
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								    union {
 								        BitField<39, 5, u64> shift_amount;
 								        BitField<48, 1, u64> negate_b;
 								        BitField<49, 1, u64> negate_a;
-												gl_shader_decompiler: Implement IADD instruction.

											
										
										
											2018-06-09 03:25:22 +00:00
+								    } alu_integer;
-												GPU: Implement the ISCADD shader instructions.

											
										
										
											2018-06-05 00:03:47 +00:00
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								    union {
 								        BitField<54, 1, u64> saturate;
 								        BitField<56, 1, u64> negate_a;
 								    } iadd32i;
-												gl_shader_decompiler: Implement BFE_IMM instruction.

											
										
										
											2018-06-07 04:58:12 +00:00
+								    union {
 								        BitField<20, 8, u64> shift_position;
 								        BitField<28, 8, u64> shift_length;
 								        BitField<48, 1, u64> negate_b;
 								        BitField<49, 1, u64> negate_a;
 								        u64 GetLeftShiftValue() const {
 								            return 32 - (shift_position + shift_length);
 								        }
 								    } bfe;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    union {
 								        BitField<48, 1, u64> negate_b;
 								        BitField<49, 1, u64> negate_c;
 								    } ffma;
-												gl_shader_decompiler: Implement LD_C instruction.

											
										
										
											2018-06-06 03:46:23 +00:00
+								    union {
 								        BitField<48, 3, UniformType> type;
 								        BitField<44, 2, u64> unknown;
 								    } ld_c;
-												ShaderGen: Implemented the fsetp instruction.

Predicate variables are now added to the generated shader code in the form of 'pX' where X is the predicate id.
These predicate variables are initialized to false on shader startup and are set via the fsetp instructions.

TODO:

* Not all the comparison types are implemented.
* Only the single-predicate version is implemented.

											
										
										
											2018-04-20 14:09:50 +00:00
+								    union {
 								        BitField<0, 3, u64> pred0;
 								        BitField<3, 3, u64> pred3;
 								        BitField<7, 1, u64> abs_a;
 								        BitField<39, 3, u64> pred39;
 								        BitField<42, 1, u64> neg_pred;
 								        BitField<43, 1, u64> neg_a;
 								        BitField<44, 1, u64> abs_b;
 								        BitField<45, 2, PredOperation> op;
 								        BitField<47, 1, u64> ftz;
 								        BitField<48, 4, PredCondition> cond;
 								        BitField<56, 1, u64> neg_b;
 								    } fsetp;
-												GPU: Implemented the ISETP_R and ISETP_C shader instructions.

											
										
										
											2018-06-04 16:12:03 +00:00
+								    union {
 								        BitField<0, 3, u64> pred0;
 								        BitField<3, 3, u64> pred3;
 								        BitField<39, 3, u64> pred39;
 								        BitField<42, 1, u64> neg_pred;
 								        BitField<45, 2, PredOperation> op;
 								        BitField<48, 1, u64> is_signed;
 								        BitField<49, 3, PredCondition> cond;
 								    } isetp;
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								    union {
 								        BitField<39, 3, u64> pred39;
 								        BitField<42, 1, u64> neg_pred;
 								        BitField<43, 1, u64> neg_a;
 								        BitField<44, 1, u64> abs_b;
 								        BitField<45, 2, PredOperation> op;
 								        BitField<48, 4, PredCondition> cond;
-												GPU: Use the bf bit in FSET to determine whether to write 0xFFFFFFFF or 1.0f.

											
										
										
											2018-06-04 16:58:29 +00:00
+								        BitField<52, 1, u64> bf;
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								        BitField<53, 1, u64> neg_b;
 								        BitField<54, 1, u64> abs_a;
 								        BitField<55, 1, u64> ftz;
 								        BitField<56, 1, u64> neg_imm;
 								    } fset;
-												GPU: Implement the iset family of shader instructions.

											
										
										
											2018-06-09 21:19:13 +00:00
 								    union {
 								        BitField<39, 3, u64> pred39;
 								        BitField<42, 1, u64> neg_pred;
 								        BitField<44, 1, u64> bf;
 								        BitField<45, 2, PredOperation> op;
 								        BitField<48, 1, u64> is_signed;
 								        BitField<49, 3, PredCondition> cond;
 								    } iset;
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
-												shader_bytecode: Add decodings for i2i instructions.

											
										
										
											2018-04-28 02:19:14 +00:00
+								    union {
-												gl_shader_decompiler: Implement integer size conversions for I2I/I2F/F2I.

											
										
										
											2018-06-15 23:40:34 +00:00
+								        BitField<8, 2, Register::Size> dest_size;
 								        BitField<10, 2, Register::Size> src_size;
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
+								        BitField<12, 1, u64> is_output_signed;
 								        BitField<13, 1, u64> is_input_signed;
-												shader_bytecode: Add decodings for i2i instructions.

											
										
										
											2018-04-28 02:19:14 +00:00
+								        BitField<41, 2, u64> selector;
 								        BitField<45, 1, u64> negate_a;
 								        BitField<49, 1, u64> abs_a;
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
 								        union {
-												gl_shader_decompiler: F2F: Implement rounding modes.

											
										
										
											2018-06-07 02:21:29 +00:00
+								            BitField<39, 2, F2iRoundingOp> rounding;
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
+								        } f2i;
 								        union {
-												gl_shader_decompiler: F2F: Implement rounding modes.

											
										
										
											2018-06-07 02:21:29 +00:00
+								            BitField<39, 4, F2fRoundingOp> rounding;
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
+								        } f2f;
-												gl_shader_decompiler: Partially implement I2I_R, and I2F_R.

											
										
										
											2018-04-29 00:01:36 +00:00
+								    } conversion;
-												shader_bytecode: Add decodings for i2i instructions.

											
										
										
											2018-04-28 02:19:14 +00:00
-												gl_shader_decompiler: Implement TEX instruction.

											
										
										
											2018-06-01 03:22:21 +00:00
+								    union {
 								        BitField<31, 4, u64> component_mask;
 								        bool IsComponentEnabled(size_t component) const {
-												Build: Fixed some MSVC warnings in various parts of the code.

											
										
										
											2018-06-20 16:39:10 +00:00
+								            return ((1ull << component) & component_mask) != 0;
-												gl_shader_decompiler: Implement TEX instruction.

											
										
										
											2018-06-01 03:22:21 +00:00
+								        }
 								    } tex;
-												gl_shader_decompiler: Support multi-destination for TEXS.

											
										
										
											2018-06-01 02:57:32 +00:00
+								    union {
-												gl_shader_decompiler: Implement TEXS component mask.

											
										
										
											2018-06-03 16:08:17 +00:00
+								        BitField<50, 3, u64> component_mask_selector;
 								        BitField<28, 8, Register> gpr28;
 								        bool HasTwoDestinations() const {
 								            return gpr28.Value() != Register::ZeroIndex;
 								        }
 								        bool IsComponentEnabled(size_t component) const {
 								            static constexpr std::array<size_t, 5> one_dest_mask{0x1, 0x2, 0x4, 0x8, 0x3};
 								            static constexpr std::array<size_t, 5> two_dest_mask{0x7, 0xb, 0xd, 0xe, 0xf};
 								            const auto& mask{HasTwoDestinations() ? two_dest_mask : one_dest_mask};
 								            ASSERT(component_mask_selector < mask.size());
-												Build: Fixed some MSVC warnings in various parts of the code.

											
										
										
											2018-06-20 16:39:10 +00:00
+								            return ((1ull << component) & mask[component_mask_selector]) != 0;
-												gl_shader_decompiler: Implement TEXS component mask.

											
										
										
											2018-06-03 16:08:17 +00:00
+								        }
-												gl_shader_decompiler: Support multi-destination for TEXS.

											
										
										
											2018-06-01 02:57:32 +00:00
+								    } texs;
-												GPU: Partially implemented the shader BRA instruction.

											
										
										
											2018-06-02 19:45:50 +00:00
+								    union {
-												GPU: Corrected the branch targets for the shader bra instruction.

											
										
										
											2018-06-05 03:56:28 +00:00
+								        BitField<20, 24, u64> target;
-												GPU: Partially implemented the shader BRA instruction.

											
										
										
											2018-06-02 19:45:50 +00:00
+								        BitField<5, 1, u64> constant_buffer;
 								        s32 GetBranchTarget() const {
 								            // Sign extend the branch target offset
-												GPU: Corrected the branch targets for the shader bra instruction.

											
										
										
											2018-06-05 03:56:28 +00:00
+								            u32 mask = 1U << (24 - 1);
-												GPU: Partially implemented the shader BRA instruction.

											
										
										
											2018-06-02 19:45:50 +00:00
+								            u32 value = static_cast<u32>(target);
-												GPU: Corrected the branch targets for the shader bra instruction.

											
										
										
											2018-06-05 03:56:28 +00:00
+								            // The branch offset is relative to the next instruction and is stored in bytes, so
 								            // divide it by the size of an instruction and add 1 to it.
 								            return static_cast<s32>((value ^ mask) - mask) / sizeof(Instruction) + 1;
-												GPU: Partially implemented the shader BRA instruction.

											
										
										
											2018-06-02 19:45:50 +00:00
+								        }
 								    } bra;
-												gl_shader_decompiler: Refactor uniform handling to allow different decodings.

											
										
										
											2018-06-06 02:45:22 +00:00
+								    union {
 								        BitField<20, 14, u64> offset;
 								        BitField<34, 5, u64> index;
 								    } cbuf34;
 								    union {
 								        BitField<20, 16, s64> offset;
 								        BitField<36, 5, u64> index;
 								    } cbuf36;
-												gl_shader_decompiler: Implement FMUL/FADD/FFMA immediate instructions.

											
										
										
											2018-04-16 00:45:56 +00:00
+								    BitField<61, 1, u64> is_b_imm;
-												gl_shader_decompiler: Implement negate, abs, etc. and lots of cleanup.

											
										
										
											2018-04-10 03:39:44 +00:00
+								    BitField<60, 1, u64> is_b_gpr;
 								    BitField<59, 1, u64> is_c_gpr;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								    Attribute attribute;
-												gl_shader_decompiler: Add support for TEXS instruction.

											
										
										
											2018-04-10 05:26:15 +00:00
+								    Sampler sampler;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								    u64 value;
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								};
 								static_assert(sizeof(Instruction) == 0x8, "Incorrect structure size");
 								static_assert(std::is_standard_layout<Instruction>::value,
 								              "Structure does not have standard layout");
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								class OpCode {
 								public:
 								    enum class Id {
 								        KIL,
-												GPU: Stub the SSY shader instruction.

This instruction tells the GPU where the flow reconverges in a non-uniform control flow scenario, we can ignore this when generating GLSL code.

											
										
										
											2018-06-09 03:46:10 +00:00
+								        SSY,
-												shader_bytecode: Add instruction decodings for BFE, IMNMX, and XMAD.

											
										
										
											2018-06-06 03:48:38 +00:00
+								        BFE_C,
 								        BFE_R,
 								        BFE_IMM,
-												GPU: Added decoding for the BRA instruction.

											
										
										
											2018-06-02 19:22:55 +00:00
+								        BRA,
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        LD_A,
-												gl_shader_decompiler: Implement LD_C instruction.

											
										
										
											2018-06-06 03:46:23 +00:00
+								        LD_C,
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        ST_A,
-												gl_shader_decompiler: Implement TEX instruction.

											
										
										
											2018-06-01 03:22:21 +00:00
+								        TEX,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        TEXQ, // Texture Query
 								        TEXS, // Texture Fetch with scalar/non-vec4 source/destinations
 								        TLDS, // Texture Load with scalar/non-vec4 source/destinations
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        EXIT,
 								        IPA,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        FFMA_IMM, // Fused Multiply and Add
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        FFMA_CR,
 								        FFMA_RC,
 								        FFMA_RR,
 								        FADD_C,
 								        FADD_R,
 								        FADD_IMM,
 								        FMUL_C,
 								        FMUL_R,
 								        FMUL_IMM,
 								        FMUL32_IMM,
-												gl_shader_decompiler: Implement IADD instruction.

											
										
										
											2018-06-09 03:25:22 +00:00
+								        IADD_C,
 								        IADD_R,
 								        IADD_IMM,
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								        IADD32I,
-												GPU: Added decodings for the ISCADD instructions.

											
										
										
											2018-06-04 23:29:51 +00:00
+								        ISCADD_C, // Scale and Add
 								        ISCADD_R,
 								        ISCADD_IMM,
-												gl_shader_decompiler: Implement RRO as a register move.

											
										
										
											2018-06-01 04:03:23 +00:00
+								        MUFU,  // Multi-Function Operator
 								        RRO_C, // Range Reduction Operator
 								        RRO_R,
 								        RRO_IMM,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        F2F_C,
 								        F2F_R,
 								        F2F_IMM,
 								        F2I_C,
 								        F2I_R,
 								        F2I_IMM,
 								        I2F_C,
 								        I2F_R,
 								        I2F_IMM,
-												Shaders: Added bit decodings for the I2I instruction.

											
										
										
											2018-04-25 17:52:55 +00:00
+								        I2I_C,
 								        I2I_R,
 								        I2I_IMM,
-												gl_shader_decompiler: Implement LOP instructions.

											
										
										
											2018-06-17 17:26:11 +00:00
+								        LOP_C,
 								        LOP_R,
 								        LOP_IMM,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        LOP32I,
 								        MOV_C,
 								        MOV_R,
 								        MOV_IMM,
-												gl_shader_decompiler: Implement MOV32_IMM instruction.

											
										
										
											2018-04-27 03:21:17 +00:00
+								        MOV32_IMM,
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								        SHL_C,
 								        SHL_R,
 								        SHL_IMM,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        SHR_C,
 								        SHR_R,
 								        SHR_IMM,
-												shader_bytecode: Implement other variants of FMNMX.

											
										
										
											2018-05-24 23:37:18 +00:00
+								        FMNMX_C,
 								        FMNMX_R,
 								        FMNMX_IMM,
-												shader_bytecode: Add instruction decodings for BFE, IMNMX, and XMAD.

											
										
										
											2018-06-06 03:48:38 +00:00
+								        IMNMX_C,
 								        IMNMX_R,
 								        IMNMX_IMM,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        FSETP_C, // Set Predicate
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        FSETP_R,
 								        FSETP_IMM,
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								        FSET_C,
 								        FSET_R,
 								        FSET_IMM,
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								        ISETP_C,
 								        ISETP_IMM,
 								        ISETP_R,
-												GPU: Added decodings for the ISET family of instructions.

											
										
										
											2018-06-09 20:56:50 +00:00
+								        ISET_R,
 								        ISET_C,
 								        ISET_IMM,
-												ShadersDecompiler: Added decoding for the PSETP instruction.

											
										
										
											2018-05-19 16:41:14 +00:00
+								        PSETP,
-												shader_bytecode: Add instruction decodings for BFE, IMNMX, and XMAD.

											
										
										
											2018-06-06 03:48:38 +00:00
+								        XMAD_IMM,
 								        XMAD_CR,
 								        XMAD_RC,
 								        XMAD_RR,
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								    };
 								    enum class Type {
 								        Trivial,
 								        Arithmetic,
-												GPU: Don't mark uniform buffers and registers as used for instructions which don't have them.

Like the MOV32I and FMUL32I instructions.
This fixes a potential crash when using these instructions.

											
										
										
											2018-06-19 00:50:35 +00:00
+								        ArithmeticImmediate,
-												gl_shader_decompiler: Implement IADD instruction.

											
										
										
											2018-06-09 03:25:22 +00:00
+								        ArithmeticInteger,
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								        ArithmeticIntegerImmediate,
-												gl_shader_decompiler: Implement BFE_IMM instruction.

											
										
										
											2018-06-07 04:58:12 +00:00
+								        Bfe,
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								        Shift,
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        Ffma,
 								        Flow,
 								        Memory,
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								        FloatSet,
 								        FloatSetPredicate,
-												GPU: Added decodings for the ISET family of instructions.

											
										
										
											2018-06-09 20:56:50 +00:00
+								        IntegerSet,
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								        IntegerSetPredicate,
-												ShadersDecompiler: Added decoding for the PSETP instruction.

											
										
										
											2018-05-19 16:41:14 +00:00
+								        PredicateSetPredicate,
-												gl_shader_decompiler: Partially implement I2I_R, and I2F_R.

											
										
										
											2018-04-29 00:01:36 +00:00
+								        Conversion,
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        Unknown,
 								    };
 								    class Matcher {
 								    public:
 								        Matcher(const char* const name, u16 mask, u16 expected, OpCode::Id id, OpCode::Type type)
 								            : name{name}, mask{mask}, expected{expected}, id{id}, type{type} {}
 								        const char* GetName() const {
 								            return name;
 								        }
 								        u16 GetMask() const {
 								            return mask;
 								        }
 								        Id GetId() const {
 								            return id;
 								        }
 								        Type GetType() const {
 								            return type;
 								        }
 								        /**
 								         * Tests to see if the given instruction is the instruction this matcher represents.
 								         * @param instruction The instruction to test
 								         * @returns true if the given instruction matches.
 								         */
 								        bool Matches(u16 instruction) const {
 								            return (instruction & mask) == expected;
 								        }
 								    private:
 								        const char* name;
 								        u16 mask;
 								        u16 expected;
 								        Id id;
 								        Type type;
 								    };
 								    static boost::optional<const Matcher&> Decode(Instruction instr) {
 								        static const auto table{GetDecodeTable()};
 								        const auto matches_instruction = [instr](const auto& matcher) {
 								            return matcher.Matches(static_cast<u16>(instr.opcode));
 								        };
 								        auto iter = std::find_if(table.begin(), table.end(), matches_instruction);
 								        return iter != table.end() ? boost::optional<const Matcher&>(*iter) : boost::none;
 								    }
 								private:
 								    struct Detail {
 								    private:
 								        static constexpr size_t opcode_bitsize = 16;
 								        /**
 								         * Generates the mask and the expected value after masking from a given bitstring.
 								         * A '0' in a bitstring indicates that a zero must be present at that bit position.
 								         * A '1' in a bitstring indicates that a one must be present at that bit position.
 								         */
 								        static auto GetMaskAndExpect(const char* const bitstring) {
 								            u16 mask = 0, expect = 0;
 								            for (size_t i = 0; i < opcode_bitsize; i++) {
 								                const size_t bit_position = opcode_bitsize - i - 1;
 								                switch (bitstring[i]) {
 								                case '0':
 								                    mask |= 1 << bit_position;
 								                    break;
 								                case '1':
 								                    expect |= 1 << bit_position;
 								                    mask |= 1 << bit_position;
 								                    break;
 								                default:
 								                    // Ignore
 								                    break;
 								                }
 								            }
 								            return std::make_tuple(mask, expect);
 								        }
 								    public:
 								        /// Creates a matcher that can match and parse instructions based on bitstring.
 								        static auto GetMatcher(const char* const bitstring, OpCode::Id op, OpCode::Type type,
 								                               const char* const name) {
 								            const auto mask_expect = GetMaskAndExpect(bitstring);
 								            return Matcher(name, std::get<0>(mask_expect), std::get<1>(mask_expect), op, type);
 								        }
 								    };
 								    static std::vector<Matcher> GetDecodeTable() {
 								        std::vector<Matcher> table = {
 								#define INST(bitstring, op, type, name) Detail::GetMatcher(bitstring, op, type, name)
 								            INST("111000110011----", Id::KIL, Type::Flow, "KIL"),
-												GPU: Stub the SSY shader instruction.

This instruction tells the GPU where the flow reconverges in a non-uniform control flow scenario, we can ignore this when generating GLSL code.

											
										
										
											2018-06-09 03:46:10 +00:00
+								            INST("111000101001----", Id::SSY, Type::Flow, "SSY"),
-												GPU: Added decoding for the BRA instruction.

											
										
										
											2018-06-02 19:22:55 +00:00
+								            INST("111000100100----", Id::BRA, Type::Flow, "BRA"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								            INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"),
-												gl_shader_decompiler: Implement LD_C instruction.

											
										
										
											2018-06-06 03:46:23 +00:00
+								            INST("1110111110010---", Id::LD_C, Type::Memory, "LD_C"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								            INST("1110111111110---", Id::ST_A, Type::Memory, "ST_A"),
-												gl_shader_decompiler: Implement TEX instruction.

											
										
										
											2018-06-01 03:22:21 +00:00
+								            INST("1100000000111---", Id::TEX, Type::Memory, "TEX"),
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								            INST("1101111101001---", Id::TEXQ, Type::Memory, "TEXQ"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								            INST("1101100---------", Id::TEXS, Type::Memory, "TEXS"),
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								            INST("1101101---------", Id::TLDS, Type::Memory, "TLDS"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								            INST("111000110000----", Id::EXIT, Type::Trivial, "EXIT"),
 								            INST("11100000--------", Id::IPA, Type::Trivial, "IPA"),
 								            INST("001100101-------", Id::FFMA_IMM, Type::Ffma, "FFMA_IMM"),
 								            INST("010010011-------", Id::FFMA_CR, Type::Ffma, "FFMA_CR"),
 								            INST("010100011-------", Id::FFMA_RC, Type::Ffma, "FFMA_RC"),
 								            INST("010110011-------", Id::FFMA_RR, Type::Ffma, "FFMA_RR"),
 								            INST("0100110001011---", Id::FADD_C, Type::Arithmetic, "FADD_C"),
 								            INST("0101110001011---", Id::FADD_R, Type::Arithmetic, "FADD_R"),
 								            INST("0011100-01011---", Id::FADD_IMM, Type::Arithmetic, "FADD_IMM"),
 								            INST("0100110001101---", Id::FMUL_C, Type::Arithmetic, "FMUL_C"),
 								            INST("0101110001101---", Id::FMUL_R, Type::Arithmetic, "FMUL_R"),
 								            INST("0011100-01101---", Id::FMUL_IMM, Type::Arithmetic, "FMUL_IMM"),
-												GPU: Don't mark uniform buffers and registers as used for instructions which don't have them.

Like the MOV32I and FMUL32I instructions.
This fixes a potential crash when using these instructions.

											
										
										
											2018-06-19 00:50:35 +00:00
+								            INST("00011110--------", Id::FMUL32_IMM, Type::ArithmeticImmediate, "FMUL32_IMM"),
-												gl_shader_decompiler: Implement IADD instruction.

											
										
										
											2018-06-09 03:25:22 +00:00
+								            INST("0100110000010---", Id::IADD_C, Type::ArithmeticInteger, "IADD_C"),
 								            INST("0101110000010---", Id::IADD_R, Type::ArithmeticInteger, "IADD_R"),
 								            INST("0011100-00010---", Id::IADD_IMM, Type::ArithmeticInteger, "IADD_IMM"),
-												GPU: Implemented the iadd32i shader instruction.

											
										
										
											2018-06-12 16:24:10 +00:00
+								            INST("0001110---------", Id::IADD32I, Type::ArithmeticIntegerImmediate, "IADD32I"),
-												gl_shader_decompiler: Implement IADD instruction.

											
										
										
											2018-06-09 03:25:22 +00:00
+								            INST("0100110000011---", Id::ISCADD_C, Type::ArithmeticInteger, "ISCADD_C"),
 								            INST("0101110000011---", Id::ISCADD_R, Type::ArithmeticInteger, "ISCADD_R"),
 								            INST("0011100-00011---", Id::ISCADD_IMM, Type::ArithmeticInteger, "ISCADD_IMM"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								            INST("0101000010000---", Id::MUFU, Type::Arithmetic, "MUFU"),
-												gl_shader_decompiler: Implement RRO as a register move.

											
										
										
											2018-06-01 04:03:23 +00:00
+								            INST("0100110010010---", Id::RRO_C, Type::Arithmetic, "RRO_C"),
 								            INST("0101110010010---", Id::RRO_R, Type::Arithmetic, "RRO_R"),
 								            INST("0011100-10010---", Id::RRO_IMM, Type::Arithmetic, "RRO_IMM"),
-												gl_shader_decompiler: Partially implement F2F_R instruction.

											
										
										
											2018-05-30 03:10:44 +00:00
+								            INST("0100110010101---", Id::F2F_C, Type::Conversion, "F2F_C"),
 								            INST("0101110010101---", Id::F2F_R, Type::Conversion, "F2F_R"),
 								            INST("0011100-10101---", Id::F2F_IMM, Type::Conversion, "F2F_IMM"),
-												GPU: Implemented the F2I_R shader instruction.

											
										
										
											2018-06-04 23:05:12 +00:00
+								            INST("0100110010110---", Id::F2I_C, Type::Conversion, "F2I_C"),
 								            INST("0101110010110---", Id::F2I_R, Type::Conversion, "F2I_R"),
 								            INST("0011100-10110---", Id::F2I_IMM, Type::Conversion, "F2I_IMM"),
-												shader_bytecode: Add several more instruction decodings.

											
										
										
											2018-04-21 02:23:52 +00:00
+								            INST("0100110010011---", Id::MOV_C, Type::Arithmetic, "MOV_C"),
 								            INST("0101110010011---", Id::MOV_R, Type::Arithmetic, "MOV_R"),
 								            INST("0011100-10011---", Id::MOV_IMM, Type::Arithmetic, "MOV_IMM"),
-												GPU: Don't mark uniform buffers and registers as used for instructions which don't have them.

Like the MOV32I and FMUL32I instructions.
This fixes a potential crash when using these instructions.

											
										
										
											2018-06-19 00:50:35 +00:00
+								            INST("000000010000----", Id::MOV32_IMM, Type::ArithmeticImmediate, "MOV32_IMM"),
-												shader_bytecode: Implement other variants of FMNMX.

											
										
										
											2018-05-24 23:37:18 +00:00
+								            INST("0100110001100---", Id::FMNMX_C, Type::Arithmetic, "FMNMX_C"),
 								            INST("0101110001100---", Id::FMNMX_R, Type::Arithmetic, "FMNMX_R"),
 								            INST("0011100-01100---", Id::FMNMX_IMM, Type::Arithmetic, "FMNMX_IMM"),
-												shader_bytecode: Add instruction decodings for BFE, IMNMX, and XMAD.

											
										
										
											2018-06-06 03:48:38 +00:00
+								            INST("0100110000100---", Id::IMNMX_C, Type::Arithmetic, "FMNMX_IMM"),
 								            INST("0101110000100---", Id::IMNMX_R, Type::Arithmetic, "FMNMX_IMM"),
 								            INST("0011100-00100---", Id::IMNMX_IMM, Type::Arithmetic, "FMNMX_IMM"),
-												gl_shader_decompiler: Implement BFE_IMM instruction.

											
										
										
											2018-06-07 04:58:12 +00:00
+								            INST("0100110000000---", Id::BFE_C, Type::Bfe, "BFE_C"),
 								            INST("0101110000000---", Id::BFE_R, Type::Bfe, "BFE_R"),
 								            INST("0011100-00000---", Id::BFE_IMM, Type::Bfe, "BFE_IMM"),
-												gl_shader_decompiler: Implement LOP instructions.

											
										
										
											2018-06-17 17:26:11 +00:00
+								            INST("0100110001000---", Id::LOP_C, Type::ArithmeticInteger, "LOP_C"),
 								            INST("0101110001000---", Id::LOP_R, Type::ArithmeticInteger, "LOP_R"),
 								            INST("0011100001000---", Id::LOP_IMM, Type::ArithmeticInteger, "LOP_IMM"),
-												gl_shader_decompiler: Refactor LOP32I instruction a bit in support of LOP.

											
										
										
											2018-06-17 16:49:34 +00:00
+								            INST("000001----------", Id::LOP32I, Type::ArithmeticIntegerImmediate, "LOP32I"),
-												gl_shader_decompiler: Implement SHL instruction.

											
										
										
											2018-06-05 02:15:19 +00:00
+								            INST("0100110001001---", Id::SHL_C, Type::Shift, "SHL_C"),
 								            INST("0101110001001---", Id::SHL_R, Type::Shift, "SHL_R"),
 								            INST("0011100-01001---", Id::SHL_IMM, Type::Shift, "SHL_IMM"),
 								            INST("0100110000101---", Id::SHR_C, Type::Shift, "SHR_C"),
 								            INST("0101110000101---", Id::SHR_R, Type::Shift, "SHR_R"),
 								            INST("0011100-00101---", Id::SHR_IMM, Type::Shift, "SHR_IMM"),
-												gl_shader_decompiler: Partially implement I2I_R, and I2F_R.

											
										
										
											2018-04-29 00:01:36 +00:00
+								            INST("0100110011100---", Id::I2I_C, Type::Conversion, "I2I_C"),
 								            INST("0101110011100---", Id::I2I_R, Type::Conversion, "I2I_R"),
 								            INST("01110001-1000---", Id::I2I_IMM, Type::Conversion, "I2I_IMM"),
 								            INST("0100110010111---", Id::I2F_C, Type::Conversion, "I2F_C"),
 								            INST("0101110010111---", Id::I2F_R, Type::Conversion, "I2F_R"),
 								            INST("0011100-10111---", Id::I2F_IMM, Type::Conversion, "I2F_IMM"),
-												Shaders: Added decodings for the FSET instructions.

											
										
										
											2018-04-25 03:42:54 +00:00
+								            INST("01011000--------", Id::FSET_R, Type::FloatSet, "FSET_R"),
 								            INST("0100100---------", Id::FSET_C, Type::FloatSet, "FSET_C"),
 								            INST("0011000---------", Id::FSET_IMM, Type::FloatSet, "FSET_IMM"),
 								            INST("010010111011----", Id::FSETP_C, Type::FloatSetPredicate, "FSETP_C"),
 								            INST("010110111011----", Id::FSETP_R, Type::FloatSetPredicate, "FSETP_R"),
 								            INST("0011011-1011----", Id::FSETP_IMM, Type::FloatSetPredicate, "FSETP_IMM"),
 								            INST("010010110110----", Id::ISETP_C, Type::IntegerSetPredicate, "ISETP_C"),
 								            INST("010110110110----", Id::ISETP_R, Type::IntegerSetPredicate, "ISETP_R"),
 								            INST("0011011-0110----", Id::ISETP_IMM, Type::IntegerSetPredicate, "ISETP_IMM"),
-												GPU: Added decodings for the ISET family of instructions.

											
										
										
											2018-06-09 20:56:50 +00:00
+								            INST("010110110101----", Id::ISET_R, Type::IntegerSet, "ISET_R"),
 								            INST("010010110101----", Id::ISET_C, Type::IntegerSet, "ISET_C"),
 								            INST("0011011-0101----", Id::ISET_IMM, Type::IntegerSet, "ISET_IMM"),
-												ShadersDecompiler: Added decoding for the PSETP instruction.

											
										
										
											2018-05-19 16:41:14 +00:00
+								            INST("0101000010010---", Id::PSETP, Type::PredicateSetPredicate, "PSETP"),
-												shader_bytecode: Add instruction decodings for BFE, IMNMX, and XMAD.

											
										
										
											2018-06-06 03:48:38 +00:00
+								            INST("0011011-00------", Id::XMAD_IMM, Type::Arithmetic, "XMAD_IMM"),
 								            INST("0100111---------", Id::XMAD_CR, Type::Arithmetic, "XMAD_CR"),
 								            INST("010100010-------", Id::XMAD_RC, Type::Arithmetic, "XMAD_RC"),
 								            INST("0101101100------", Id::XMAD_RR, Type::Arithmetic, "XMAD_RR"),
-												shader_bytecode: Decode instructions based on bit strings.

											
										
										
											2018-04-21 00:49:05 +00:00
+								        };
 								#undef INST
 								        std::stable_sort(table.begin(), table.end(), [](const auto& a, const auto& b) {
 								            // If a matcher has more bits in its mask it is more specific, so it
 								            // should come first.
 								            return std::bitset<16>(a.GetMask()).count() > std::bitset<16>(b.GetMask()).count();
 								        });
 								        return table;
 								    }
 								};
-												shader_bytecode: Add initial module for shader decoding.

											
										
										
											2018-04-05 01:43:40 +00:00
+								} // namespace Shader
 								} // namespace Tegra