#pragma once #include "ShaderParam.h" #include "RSXFragmentProgram.h" #include // Helper for GPR occupancy tracking struct temp_register { bool aliased_r0 = false; bool aliased_h0 = false; bool aliased_h1 = false; bool last_write_half[4] = { false, false, false, false }; u32 real_index = -1; u32 h0_writes = 0u; // Number of writes to the first 64-bits of the register u32 h1_writes = 0u; // Number of writes to the last 64-bits of the register void tag(u32 index, bool half_register, bool x, bool y, bool z, bool w) { if (half_register) { if (index & 1) { if (x) last_write_half[2] = true; if (y) last_write_half[2] = true; if (z) last_write_half[3] = true; if (w) last_write_half[3] = true; aliased_h1 = true; h1_writes++; } else { if (x) last_write_half[0] = true; if (y) last_write_half[0] = true; if (z) last_write_half[1] = true; if (w) last_write_half[1] = true; aliased_h0 = true; h0_writes++; } } else { if (x) last_write_half[0] = false; if (y) last_write_half[1] = false; if (z) last_write_half[2] = false; if (w) last_write_half[3] = false; aliased_r0 = true; h0_writes++; h1_writes++; } if (real_index == umax) { if (half_register) real_index = index >> 1; else real_index = index; } } bool requires_gather(u8 channel) const { //Data fetched from the single precision register requires merging of the two half registers ensure(channel < 4); if (aliased_h0 && channel < 2) { return last_write_half[channel]; } if (aliased_h1 && channel > 1) { return last_write_half[channel]; } return false; } bool requires_split(u32 /*index*/) const { //Data fetched from any of the two half registers requires sync with the full register if (!(last_write_half[0] || last_write_half[1]) && aliased_r0) { //r0 has been written to //TODO: Check for specific elements in real32 register return true; } return false; } std::string gather_r() const { std::string h0 = "h" + std::to_string(real_index << 1); std::string h1 = "h" + std::to_string(real_index << 1 | 1); std::string reg = "r" + std::to_string(real_index); std::string ret = "//Invalid gather"; if (aliased_h0 && aliased_h1) ret = "(gather(" + h0 + ", " + h1 + "))"; else if (aliased_h0) ret = "(gather(" + h0 + "), " + reg + ".zw)"; else if (aliased_h1) ret = "(" + reg + ".xy, gather(" + h1 + "))"; return ret; } }; /** * This class is used to translate RSX Fragment program to GLSL/HLSL code * Backend with text based shader can subclass this class and implement : * - virtual std::string getFloatTypeName(usz elementCount) = 0; * - virtual std::string getHalfTypeName(usz elementCount) = 0; * - virtual std::string getFunction(enum class FUNCTION) = 0; * - virtual std::string saturate(const std::string &code) = 0; * - virtual std::string compareFunction(enum class COMPARE, const std::string &, const std::string &) = 0; * - virtual void insertHeader(std::stringstream &OS) = 0; * - virtual void insertInputs(std::stringstream &OS) = 0; * - virtual void insertOutputs(std::stringstream &OS) = 0; * - virtual void insertConstants(std::stringstream &OS) = 0; * - virtual void insertMainStart(std::stringstream &OS) = 0; * - virtual void insertMainEnd(std::stringstream &OS) = 0; */ class FragmentProgramDecompiler { enum OPFLAGS { no_src_mask = 1, src_cast_f32 = 2, skip_type_cast = 4, texture_ref = 8, op_extern = src_cast_f32 | skip_type_cast, }; OPDEST dst; SRC0 src0; SRC1 src1; SRC2 src2; u32 opflags; std::string main; u32& m_size; u32 m_const_index = 0; u32 m_offset; u32 m_location = 0; u32 m_loop_count; int m_code_level; std::vector m_end_offsets; std::vector m_else_offsets; std::array temp_registers; std::string GetMask() const; void SetDst(std::string code, u32 flags = 0); void AddCode(const std::string& code); std::string AddReg(u32 index, bool fp16); bool HasReg(u32 index, bool fp16); std::string AddCond(); std::string AddConst(); std::string AddTex(); void AddFlowOp(const std::string& code); std::string Format(const std::string& code, bool ignore_redirects = false); //Technically a temporary workaround until we know what type3 is std::string AddType3(); //Support the transform-2d temp result for use with TEXBEM std::string AddX2d(); //Prevents operations from overflowing the desired range (tested with fp_dynamic3 autotest sample, DS2 for src1.input_prec_mod) std::string ClampValue(const std::string& code, u32 precision); /** * Returns true if the dst set is not a vector (i.e only a single component) */ bool DstExpectsSca() const; void AddCodeCond(const std::string& lhs, const std::string& rhs); std::string GetRawCond(); std::string GetCond(); template std::string GetSRC(T src); std::string BuildCode(); static u32 GetData(const u32 d) { return d << 16 | d >> 16; } /** * Emits code if opcode is an SCT/SCB one and returns true, * otherwise do nothing and return false. * NOTE: What does SCT means ??? */ bool handle_sct_scb(u32 opcode); /** * Emits code if opcode is an TEX SRB one and returns true, * otherwise do nothing and return false. * NOTE: What does TEX SRB means ??? */ bool handle_tex_srb(u32 opcode); protected: const RSXFragmentProgram &m_prog; u32 m_ctrl = 0; /** returns the type name of float vectors. */ virtual std::string getFloatTypeName(usz elementCount) = 0; /** returns the type name of half vectors. */ virtual std::string getHalfTypeName(usz elementCount) = 0; /** returns string calling function where arguments are passed via * $0 $1 $2 substring. */ virtual std::string getFunction(FUNCTION) = 0; /** returns string calling comparison function on 2 args passed as strings. */ virtual std::string compareFunction(COMPARE, const std::string &, const std::string &) = 0; /** Insert header of shader file (eg #version, "system constants"...) */ virtual void insertHeader(std::stringstream &OS) = 0; /** Insert global declaration of fragments inputs. */ virtual void insertInputs(std::stringstream &OS) = 0; /** insert global declaration of fragments outputs. */ virtual void insertOutputs(std::stringstream &OS) = 0; /** insert declaration of shader constants. */ virtual void insertConstants(std::stringstream &OS) = 0; /** insert helper function definitions. */ virtual void insertGlobalFunctions(std::stringstream &OS) = 0; /** insert beginning of main (signature, temporary declaration...) */ virtual void insertMainStart(std::stringstream &OS) = 0; /** insert end of main function (return value, output copy...) */ virtual void insertMainEnd(std::stringstream &OS) = 0; public: enum : u16 { in_wpos = (1 << 0), in_diff_color = (1 << 1), in_spec_color = (1 << 2), in_fogc = (1 << 3), in_tc0 = (1 << 4), in_tc1 = (1 << 5), in_tc2 = (1 << 6), in_tc3 = (1 << 7), in_tc4 = (1 << 8), in_tc5 = (1 << 9), in_tc6 = (1 << 10), in_tc7 = (1 << 11), in_tc8 = (1 << 12), in_tc9 = (1 << 13), in_ssa = (1 << 14) }; struct { u16 in_register_mask = 0; u16 common_access_sampler_mask = 0; u16 shadow_sampler_mask = 0; u16 redirected_sampler_mask = 0; bool has_lit_op = false; bool has_gather_op = false; bool has_no_output = false; bool has_discard_op = false; bool has_tex_op = false; bool has_divsq = false; bool has_clamp = false; bool has_w_access = false; bool has_exp_tex_op = false; } properties; struct { bool has_native_half_support = false; bool emulate_depth_compare = false; } device_props; ParamArray m_parr; FragmentProgramDecompiler(const RSXFragmentProgram &prog, u32& size); FragmentProgramDecompiler(const FragmentProgramDecompiler&) = delete; FragmentProgramDecompiler(FragmentProgramDecompiler&&) = delete; std::string Decompile(); };