2015-05-19 18:17:08 +02:00
|
|
|
#include "stdafx.h"
#include "Emu/Memory/Memory.h"
#include "Emu/System.h"
#include "FragmentProgramDecompiler.h"

#include <algorithm>
#include <cstring>
|
|
|
|
|
|
2016-01-10 20:09:56 +01:00
|
|
|
// Creates a decompiler for the fragment program `prog`.
// `size` is stored in m_size, which is then reset to 0 in the body.
// NOTE(review): m_size is presumably a reference member, in which case the reset
// is visible to the caller - confirm against the class declaration.
FragmentProgramDecompiler::FragmentProgramDecompiler(const RSXFragmentProgram &prog, u32& size)
	: m_prog(prog)
	, m_size(size)
	, m_const_index(0)
	, m_location(0)
	, m_ctrl(prog.ctrl)
{
	// Start with an empty program size.
	m_size = 0;
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
void FragmentProgramDecompiler::SetDst(std::string code, bool append_mask)
|
|
|
|
|
{
|
|
|
|
|
if (!src0.exec_if_eq && !src0.exec_if_gr && !src0.exec_if_lt) return;
|
|
|
|
|
|
|
|
|
|
switch (src1.scale)
|
|
|
|
|
{
|
|
|
|
|
case 0: break;
|
|
|
|
|
case 1: code = "(" + code + " * 2.0)"; break;
|
|
|
|
|
case 2: code = "(" + code + " * 4.0)"; break;
|
|
|
|
|
case 3: code = "(" + code + " * 8.0)"; break;
|
|
|
|
|
case 5: code = "(" + code + " / 2.0)"; break;
|
|
|
|
|
case 6: code = "(" + code + " / 4.0)"; break;
|
|
|
|
|
case 7: code = "(" + code + " / 8.0)"; break;
|
|
|
|
|
|
|
|
|
|
default:
|
2015-08-12 20:38:17 +02:00
|
|
|
LOG_ERROR(RSX, "Bad scale: %d", u32{ src1.scale });
|
2015-05-19 18:17:08 +02:00
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
2017-07-05 00:16:59 +02:00
|
|
|
if (!dst.no_dest)
|
2017-03-07 11:40:38 +01:00
|
|
|
{
|
2017-11-13 20:07:23 +01:00
|
|
|
if (dst.exp_tex)
|
|
|
|
|
{
|
2018-01-24 22:09:27 +01:00
|
|
|
//Expand [0,1] to [-1, 1]. Confirmed by Castlevania: LOS
|
2017-11-13 20:07:23 +01:00
|
|
|
AddCode("//exp tex flag is set");
|
|
|
|
|
code = "((" + code + "- 0.5) * 2.)";
|
|
|
|
|
}
|
2017-07-05 00:16:59 +02:00
|
|
|
|
|
|
|
|
if (dst.saturate)
|
2018-01-24 22:09:27 +01:00
|
|
|
{
|
2017-07-05 00:16:59 +02:00
|
|
|
code = saturate(code);
|
2018-01-24 22:09:27 +01:00
|
|
|
}
|
|
|
|
|
else if (dst.prec)
|
|
|
|
|
{
|
|
|
|
|
switch (dst.opcode)
|
|
|
|
|
{
|
|
|
|
|
case RSX_FP_OPCODE_NRM:
|
|
|
|
|
case RSX_FP_OPCODE_MAX:
|
|
|
|
|
case RSX_FP_OPCODE_MIN:
|
|
|
|
|
case RSX_FP_OPCODE_COS:
|
|
|
|
|
case RSX_FP_OPCODE_SIN:
|
|
|
|
|
case RSX_FP_OPCODE_REFL:
|
|
|
|
|
case RSX_FP_OPCODE_EX2:
|
|
|
|
|
case RSX_FP_OPCODE_FRC:
|
|
|
|
|
case RSX_FP_OPCODE_LIT:
|
|
|
|
|
case RSX_FP_OPCODE_LIF:
|
|
|
|
|
case RSX_FP_OPCODE_LRP:
|
|
|
|
|
case RSX_FP_OPCODE_LG2:
|
|
|
|
|
break;
|
|
|
|
|
case RSX_FP_OPCODE_MOV:
|
|
|
|
|
//NOTE: Sometimes varying inputs from VS are out of range so do not exempt any input types, unless fp16 (Naruto UNS)
|
|
|
|
|
if (dst.fp16 && src0.fp16 && src0.reg_type == RSX_FP_REGISTER_TYPE_TEMP)
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
{
|
|
|
|
|
//fp16 precsion flag on f32 register; ignore
|
|
|
|
|
if (dst.prec == 1 && !dst.fp16)
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
//clamp value to allowed range
|
|
|
|
|
code = ClampValue(code, dst.prec);
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2017-03-07 11:40:38 +01:00
|
|
|
}
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
code += (append_mask ? "$m" : "");
|
|
|
|
|
|
|
|
|
|
if (dst.no_dest)
|
|
|
|
|
{
|
|
|
|
|
if (dst.set_cond)
|
|
|
|
|
{
|
|
|
|
|
AddCode("$ifcond " + m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), "cc" + std::to_string(src0.cond_mod_reg_index)) + "$m = " + code + ";");
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
AddCode("$ifcond " + code + ";");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string dest = AddReg(dst.dest_reg, dst.fp16) + "$m";
|
|
|
|
|
|
|
|
|
|
AddCodeCond(Format(dest), code);
|
|
|
|
|
//AddCode("$ifcond " + dest + code + (append_mask ? "$m;" : ";"));
|
|
|
|
|
|
|
|
|
|
if (dst.set_cond)
|
|
|
|
|
{
|
|
|
|
|
AddCode(m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), "cc" + std::to_string(src0.cond_mod_reg_index)) + "$m = " + dest + ";");
|
|
|
|
|
}
|
2017-11-30 19:47:25 +01:00
|
|
|
|
|
|
|
|
u32 reg_index = dst.fp16 ? dst.dest_reg >> 1 : dst.dest_reg;
|
2018-02-23 20:48:51 +01:00
|
|
|
temp_registers[reg_index].tag(dst.dest_reg, !!dst.fp16, dst.mask_x, dst.mask_y, dst.mask_z, dst.mask_w);
|
2015-05-19 18:17:08 +02:00
|
|
|
}
|
|
|
|
|
|
2017-05-21 21:14:59 +02:00
|
|
|
void FragmentProgramDecompiler::AddFlowOp(std::string code)
|
|
|
|
|
{
|
|
|
|
|
//Flow operations can only consider conditionals and have no dst
|
|
|
|
|
|
|
|
|
|
if (src0.exec_if_gr && src0.exec_if_lt && src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
AddCode(code + ";");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
else if (!src0.exec_if_gr && !src0.exec_if_lt && !src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
AddCode("//" + code + ";");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
//We have a conditional expression
|
|
|
|
|
std::string cond = GetRawCond();
|
|
|
|
|
|
|
|
|
|
AddCode("if (any(" + cond + ")) " + code + ";");
|
|
|
|
|
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
void FragmentProgramDecompiler::AddCode(const std::string& code)
|
|
|
|
|
{
|
|
|
|
|
main.append(m_code_level, '\t') += Format(code) + "\n";
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::GetMask()
|
|
|
|
|
{
|
|
|
|
|
std::string ret;
|
|
|
|
|
|
|
|
|
|
static const char dst_mask[4] =
|
|
|
|
|
{
|
|
|
|
|
'x', 'y', 'z', 'w',
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
if (dst.mask_x) ret += dst_mask[0];
|
|
|
|
|
if (dst.mask_y) ret += dst_mask[1];
|
|
|
|
|
if (dst.mask_z) ret += dst_mask[2];
|
|
|
|
|
if (dst.mask_w) ret += dst_mask[3];
|
|
|
|
|
|
|
|
|
|
return ret.empty() || strncmp(ret.c_str(), dst_mask, 4) == 0 ? "" : ("." + ret);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::AddReg(u32 index, int fp16)
|
|
|
|
|
{
|
2015-05-23 00:04:42 +02:00
|
|
|
return m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), std::string(fp16 ? "h" : "r") + std::to_string(index), getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
2015-05-19 18:17:08 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Reports whether temp register `index` ("h<index>" for fp16, "r<index>"
// otherwise) is already present in the parameter array.
bool FragmentProgramDecompiler::HasReg(u32 index, int fp16)
{
	const std::string reg_name = std::string(fp16 ? "h" : "r") + std::to_string(index);

	return m_parr.HasParam(PF_PARAM_NONE, getFloatTypeName(4), reg_name);
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::AddCond()
|
|
|
|
|
{
|
|
|
|
|
return m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), "cc" + std::to_string(src0.cond_reg_index));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::AddConst()
|
|
|
|
|
{
|
|
|
|
|
std::string name = std::string("fc") + std::to_string(m_size + 4 * 4);
|
|
|
|
|
if (m_parr.HasParam(PF_PARAM_UNIFORM, getFloatTypeName(4), name))
|
|
|
|
|
{
|
|
|
|
|
return name;
|
|
|
|
|
}
|
|
|
|
|
|
2016-01-26 20:42:54 +01:00
|
|
|
auto data = (be_t<u32>*) ((char*)m_prog.addr + m_size + 4 * SIZE_32(u32));
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
m_offset = 2 * 4 * sizeof(u32);
|
|
|
|
|
u32 x = GetData(data[0]);
|
|
|
|
|
u32 y = GetData(data[1]);
|
|
|
|
|
u32 z = GetData(data[2]);
|
|
|
|
|
u32 w = GetData(data[3]);
|
|
|
|
|
return m_parr.AddParam(PF_PARAM_UNIFORM, getFloatTypeName(4), name,
|
|
|
|
|
std::string(getFloatTypeName(4) + "(") + std::to_string((float&)x) + ", " + std::to_string((float&)y)
|
|
|
|
|
+ ", " + std::to_string((float&)z) + ", " + std::to_string((float&)w) + ")");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::AddTex()
|
|
|
|
|
{
|
2016-01-24 22:24:28 +01:00
|
|
|
std::string sampler;
|
|
|
|
|
switch (m_prog.get_texture_dimension(dst.tex_num))
|
|
|
|
|
{
|
2016-03-30 21:52:29 +02:00
|
|
|
case rsx::texture_dimension_extended::texture_dimension_1d:
|
2016-01-27 00:34:34 +01:00
|
|
|
sampler = "sampler1D";
|
|
|
|
|
break;
|
2016-03-30 21:52:29 +02:00
|
|
|
case rsx::texture_dimension_extended::texture_dimension_cubemap:
|
2016-01-24 22:24:28 +01:00
|
|
|
sampler = "samplerCube";
|
|
|
|
|
break;
|
2016-03-30 21:52:29 +02:00
|
|
|
case rsx::texture_dimension_extended::texture_dimension_2d:
|
2016-01-24 22:24:28 +01:00
|
|
|
sampler = "sampler2D";
|
|
|
|
|
break;
|
2016-03-30 21:52:29 +02:00
|
|
|
case rsx::texture_dimension_extended::texture_dimension_3d:
|
2016-01-24 22:24:28 +01:00
|
|
|
sampler = "sampler3D";
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
return m_parr.AddParam(PF_PARAM_UNIFORM, sampler, std::string("tex") + std::to_string(dst.tex_num));
|
2015-05-19 18:17:08 +02:00
|
|
|
}
|
|
|
|
|
|
2017-03-21 12:53:52 +01:00
|
|
|
std::string FragmentProgramDecompiler::AddType3()
|
|
|
|
|
{
|
|
|
|
|
return m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), "src3", getFloatTypeName(4) + "(1., 1., 1., 1.)");
|
|
|
|
|
}
|
|
|
|
|
|
2017-12-10 23:34:44 +01:00
|
|
|
std::string FragmentProgramDecompiler::AddX2d()
|
|
|
|
|
{
|
|
|
|
|
return m_parr.AddParam(PF_PARAM_NONE, getFloatTypeName(4), "x2d", getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
}
|
|
|
|
|
|
2017-03-07 11:40:38 +01:00
|
|
|
//Both of these were tested with a trace SoulCalibur IV title screen
|
2018-04-29 08:41:51 +02:00
|
|
|
//Failure to catch causes infinite values since there is a lot of rcp(0)
|
2017-03-07 11:40:38 +01:00
|
|
|
std::string FragmentProgramDecompiler::NotZero(const std::string& code)
|
|
|
|
|
{
|
2018-01-24 10:09:02 +01:00
|
|
|
return "(max(abs(" + code + "), 0.0000000001) * sign(" + code + "))";
|
2017-03-07 11:40:38 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Wraps the shader expression `code` so that it evaluates to its absolute
// value, but never less than 1e-10.
std::string FragmentProgramDecompiler::NotZeroPositive(const std::string& code)
{
	std::string wrapped = "max(abs(";
	wrapped += code;
	wrapped += "), 0.0000000001)";

	return wrapped;
}
|
|
|
|
|
|
2017-11-13 20:07:23 +01:00
|
|
|
// Wraps the shader expression `code` in a clamp() matching `precision`:
//   1 -> [-65504, 65504]   2 -> [-2, 2]   3 -> [-1, 1]   4 -> [0, 1]
// Any other precision (including 0) returns `code` unchanged.
//
// FP16 is expected to overflow a lot easier at 0+-65504
// FP32 can still work up to 0+-3.4E38
// See http://http.download.nvidia.com/developer/Papers/2005/FP_Specials/FP_Specials.pdf
std::string FragmentProgramDecompiler::ClampValue(const std::string& code, u32 precision)
{
	// Tail of the clamp() call for the requested precision; null means "no clamp".
	const char* bounds = nullptr;

	switch (precision)
	{
	case 1: bounds = ", -65504., 65504.)"; break;
	case 2: bounds = ", -2., 2.)"; break;
	case 3: bounds = ", -1., 1.)"; break;
	case 4: bounds = ", 0., 1.)"; break;
	default: break;
	}

	if (bounds == nullptr)
	{
		return code;
	}

	return "clamp(" + code + bounds;
}
|
|
|
|
|
|
2017-06-22 19:09:05 +02:00
|
|
|
bool FragmentProgramDecompiler::DstExpectsSca()
|
|
|
|
|
{
|
|
|
|
|
int writes = 0;
|
|
|
|
|
|
|
|
|
|
if (dst.mask_x) writes++;
|
|
|
|
|
if (dst.mask_y) writes++;
|
|
|
|
|
if (dst.mask_z) writes++;
|
|
|
|
|
if (dst.mask_w) writes++;
|
|
|
|
|
|
|
|
|
|
return (writes == 1);
|
|
|
|
|
}
|
|
|
|
|
|
2017-12-10 23:34:44 +01:00
|
|
|
std::string FragmentProgramDecompiler::Format(const std::string& code, bool ignore_redirects)
|
2015-05-19 18:17:08 +02:00
|
|
|
{
|
|
|
|
|
const std::pair<std::string, std::function<std::string()>> repl_list[] =
|
|
|
|
|
{
|
|
|
|
|
{ "$$", []() -> std::string { return "$"; } },
|
|
|
|
|
{ "$0", [this]() -> std::string {return GetSRC<SRC0>(src0);} },//std::bind(std::mem_fn(&GLFragmentDecompilerThread::GetSRC<SRC0>), *this, src0) },
|
|
|
|
|
{ "$1", [this]() -> std::string {return GetSRC<SRC1>(src1);} },//std::bind(std::mem_fn(&GLFragmentDecompilerThread::GetSRC<SRC1>), this, src1) },
|
|
|
|
|
{ "$2", [this]() -> std::string {return GetSRC<SRC2>(src2);} },//std::bind(std::mem_fn(&GLFragmentDecompilerThread::GetSRC<SRC2>), this, src2) },
|
|
|
|
|
{ "$t", std::bind(std::mem_fn(&FragmentProgramDecompiler::AddTex), this) },
|
2017-02-10 10:08:46 +01:00
|
|
|
{ "$_i", [this]() -> std::string {return std::to_string(dst.tex_num);} },
|
2015-05-19 18:17:08 +02:00
|
|
|
{ "$m", std::bind(std::mem_fn(&FragmentProgramDecompiler::GetMask), this) },
|
|
|
|
|
{ "$ifcond ", [this]() -> std::string
|
2018-02-23 20:48:51 +01:00
|
|
|
{
|
|
|
|
|
const std::string& cond = GetCond();
|
|
|
|
|
if (cond == "true") return "";
|
|
|
|
|
return "if(" + cond + ") ";
|
|
|
|
|
}
|
2015-05-19 18:17:08 +02:00
|
|
|
},
|
|
|
|
|
{ "$cond", std::bind(std::mem_fn(&FragmentProgramDecompiler::GetCond), this) },
|
2018-02-23 20:48:51 +01:00
|
|
|
{ "$_c", std::bind(std::mem_fn(&FragmentProgramDecompiler::AddConst), this) },
|
|
|
|
|
{ "$float4", [this]() -> std::string { return getFloatTypeName(4); } }
|
2015-05-19 18:17:08 +02:00
|
|
|
};
|
|
|
|
|
|
2017-12-10 23:34:44 +01:00
|
|
|
if (!ignore_redirects)
|
|
|
|
|
{
|
|
|
|
|
//Special processing redirects
|
2017-12-11 09:37:20 +01:00
|
|
|
switch (dst.opcode)
|
|
|
|
|
{
|
|
|
|
|
case RSX_FP_OPCODE_TEXBEM:
|
|
|
|
|
case RSX_FP_OPCODE_TXPBEM:
|
2017-12-10 23:34:44 +01:00
|
|
|
{
|
|
|
|
|
//Redirect parameter 0 to the x2d temp register for TEXBEM
|
|
|
|
|
//TODO: Organize this a little better
|
|
|
|
|
std::pair<std::string, std::string> repl[] = { { "$0", "x2d" } };
|
|
|
|
|
std::string result = fmt::replace_all(code, repl);
|
|
|
|
|
|
2017-12-11 15:44:45 +01:00
|
|
|
return fmt::replace_all(result, repl_list);
|
2017-12-10 23:34:44 +01:00
|
|
|
}
|
2017-12-11 09:37:20 +01:00
|
|
|
}
|
2017-12-10 23:34:44 +01:00
|
|
|
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
return fmt::replace_all(code, repl_list);
|
|
|
|
|
}
|
|
|
|
|
|
2017-05-21 21:14:59 +02:00
|
|
|
std::string FragmentProgramDecompiler::GetRawCond()
|
2015-05-19 18:17:08 +02:00
|
|
|
{
|
|
|
|
|
static const char f[4] = { 'x', 'y', 'z', 'w' };
|
|
|
|
|
|
|
|
|
|
std::string swizzle, cond;
|
|
|
|
|
swizzle += f[src0.cond_swizzle_x];
|
|
|
|
|
swizzle += f[src0.cond_swizzle_y];
|
|
|
|
|
swizzle += f[src0.cond_swizzle_z];
|
|
|
|
|
swizzle += f[src0.cond_swizzle_w];
|
|
|
|
|
swizzle = swizzle == "xyzw" ? "" : "." + swizzle;
|
|
|
|
|
|
|
|
|
|
if (src0.exec_if_gr && src0.exec_if_eq)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SGE, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
else if (src0.exec_if_lt && src0.exec_if_eq)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SLE, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
else if (src0.exec_if_gr && src0.exec_if_lt)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SNE, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
else if (src0.exec_if_gr)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SGT, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
else if (src0.exec_if_lt)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SLT, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
else //if(src0.exec_if_eq)
|
|
|
|
|
cond = compareFunction(COMPARE::FUNCTION_SEQ, AddCond() + swizzle, getFloatTypeName(4) + "(0., 0., 0., 0.)");
|
|
|
|
|
|
2017-05-21 21:14:59 +02:00
|
|
|
return cond;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::GetCond()
|
|
|
|
|
{
|
|
|
|
|
if (src0.exec_if_gr && src0.exec_if_lt && src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
return "true";
|
|
|
|
|
}
|
|
|
|
|
else if (!src0.exec_if_gr && !src0.exec_if_lt && !src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
return "false";
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return "any(" + GetRawCond() + ")";
|
2015-05-19 18:17:08 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void FragmentProgramDecompiler::AddCodeCond(const std::string& dst, const std::string& src)
|
|
|
|
|
{
|
|
|
|
|
if (src0.exec_if_gr && src0.exec_if_lt && src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
AddCode(dst + " = " + src + ";");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (!src0.exec_if_gr && !src0.exec_if_lt && !src0.exec_if_eq)
|
|
|
|
|
{
|
|
|
|
|
AddCode("//" + dst + " = " + src + ";");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static const char f[4] = { 'x', 'y', 'z', 'w' };
|
2017-05-21 21:14:59 +02:00
|
|
|
std::string cond = GetRawCond();
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
ShaderVariable dst_var(dst);
|
2018-04-29 08:41:51 +02:00
|
|
|
dst_var.simplify();
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
//const char *c_mask = f;
|
|
|
|
|
|
|
|
|
|
if (dst_var.swizzles[0].length() == 1)
|
|
|
|
|
{
|
|
|
|
|
AddCode("if (" + cond + ".x) " + dst + " = " + src + ";");
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
for (int i = 0; i < dst_var.swizzles[0].length(); ++i)
|
|
|
|
|
{
|
|
|
|
|
AddCode("if (" + cond + "." + f[i] + ") " + dst + "." + f[i] + " = " + src + "." + f[i] + ";");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
template<typename T> std::string FragmentProgramDecompiler::GetSRC(T src)
|
|
|
|
|
{
|
|
|
|
|
std::string ret;
|
2017-11-22 15:38:36 +01:00
|
|
|
bool apply_precision_modifier = !!src1.input_prec_mod;
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
switch (src.reg_type)
|
|
|
|
|
{
|
2016-06-10 00:03:43 +02:00
|
|
|
case RSX_FP_REGISTER_TYPE_TEMP:
|
2017-11-30 19:47:25 +01:00
|
|
|
|
|
|
|
|
if (!src.fp16)
|
|
|
|
|
{
|
|
|
|
|
if (dst.opcode == RSX_FP_OPCODE_UP16 ||
|
|
|
|
|
dst.opcode == RSX_FP_OPCODE_UP2 ||
|
|
|
|
|
dst.opcode == RSX_FP_OPCODE_UP4 ||
|
|
|
|
|
dst.opcode == RSX_FP_OPCODE_UPB ||
|
|
|
|
|
dst.opcode == RSX_FP_OPCODE_UPG)
|
|
|
|
|
{
|
|
|
|
|
auto ® = temp_registers[src.tmp_reg_index];
|
2018-02-23 20:48:51 +01:00
|
|
|
if (reg.requires_gather(src.swizzle_x))
|
2018-01-24 22:09:27 +01:00
|
|
|
{
|
|
|
|
|
properties.has_gather_op = true;
|
2018-02-23 20:48:51 +01:00
|
|
|
AddReg(src.tmp_reg_index, src.fp16);
|
|
|
|
|
ret = getFloatTypeName(4) + reg.gather_r();
|
|
|
|
|
break;
|
2018-01-24 22:09:27 +01:00
|
|
|
}
|
2017-11-30 19:47:25 +01:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
ret += AddReg(src.tmp_reg_index, src.fp16);
|
|
|
|
|
break;
|
|
|
|
|
|
2016-06-10 00:03:43 +02:00
|
|
|
case RSX_FP_REGISTER_TYPE_INPUT:
|
2015-05-19 18:17:08 +02:00
|
|
|
{
|
|
|
|
|
static const std::string reg_table[] =
|
|
|
|
|
{
|
2016-09-27 11:54:35 +02:00
|
|
|
"wpos",
|
2015-05-19 18:17:08 +02:00
|
|
|
"diff_color", "spec_color",
|
|
|
|
|
"fogc",
|
|
|
|
|
"tc0", "tc1", "tc2", "tc3", "tc4", "tc5", "tc6", "tc7", "tc8", "tc9",
|
|
|
|
|
"ssa"
|
|
|
|
|
};
|
|
|
|
|
|
2017-11-22 15:38:36 +01:00
|
|
|
//TODO: Investigate effect of input modifier on this type
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
switch (dst.src_attr_reg_num)
|
|
|
|
|
{
|
2018-01-24 22:09:27 +01:00
|
|
|
case 0x00:
|
|
|
|
|
ret += reg_table[0];
|
|
|
|
|
properties.has_wpos_input = true;
|
|
|
|
|
break;
|
2015-05-19 18:17:08 +02:00
|
|
|
default:
|
|
|
|
|
if (dst.src_attr_reg_num < sizeof(reg_table) / sizeof(reg_table[0]))
|
|
|
|
|
{
|
|
|
|
|
ret += m_parr.AddParam(PF_PARAM_IN, getFloatTypeName(4), reg_table[dst.src_attr_reg_num]);
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
2015-08-12 20:38:17 +02:00
|
|
|
LOG_ERROR(RSX, "Bad src reg num: %d", u32{ dst.src_attr_reg_num });
|
2015-05-19 18:17:08 +02:00
|
|
|
ret += m_parr.AddParam(PF_PARAM_IN, getFloatTypeName(4), "unk");
|
|
|
|
|
Emu.Pause();
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
2016-06-10 00:03:43 +02:00
|
|
|
case RSX_FP_REGISTER_TYPE_CONSTANT:
|
2015-05-19 18:17:08 +02:00
|
|
|
ret += AddConst();
|
2017-11-22 15:38:36 +01:00
|
|
|
apply_precision_modifier = false;
|
2015-05-19 18:17:08 +02:00
|
|
|
break;
|
|
|
|
|
|
2016-06-10 00:03:43 +02:00
|
|
|
case RSX_FP_REGISTER_TYPE_UNKNOWN: // ??? Used by a few games, what is it?
|
2017-03-21 12:53:52 +01:00
|
|
|
LOG_ERROR(RSX, "Src type 3 used, opcode=0x%X, dst=0x%X s0=0x%X s1=0x%X s2=0x%X",
|
|
|
|
|
dst.opcode, dst.HEX, src0.HEX, src1.HEX, src2.HEX);
|
|
|
|
|
|
|
|
|
|
ret += AddType3();
|
2017-11-22 15:38:36 +01:00
|
|
|
apply_precision_modifier = false;
|
2015-10-17 19:47:18 +02:00
|
|
|
break;
|
2015-09-10 16:30:14 +02:00
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
default:
|
2015-08-12 20:38:17 +02:00
|
|
|
LOG_ERROR(RSX, "Bad src type %d", u32{ src.reg_type });
|
2015-05-19 18:17:08 +02:00
|
|
|
Emu.Pause();
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static const char f[4] = { 'x', 'y', 'z', 'w' };
|
|
|
|
|
|
|
|
|
|
std::string swizzle = "";
|
|
|
|
|
swizzle += f[src.swizzle_x];
|
|
|
|
|
swizzle += f[src.swizzle_y];
|
|
|
|
|
swizzle += f[src.swizzle_z];
|
|
|
|
|
swizzle += f[src.swizzle_w];
|
|
|
|
|
|
|
|
|
|
if (strncmp(swizzle.c_str(), f, 4) != 0) ret += "." + swizzle;
|
|
|
|
|
|
2017-11-17 17:43:57 +01:00
|
|
|
//Warning: Modifier order matters. e.g neg should be applied after precision clamping (tested with Naruto UNS)
|
2015-05-19 18:17:08 +02:00
|
|
|
if (src.abs) ret = "abs(" + ret + ")";
|
2017-11-22 15:38:36 +01:00
|
|
|
if (apply_precision_modifier) ret = ClampValue(ret, src1.input_prec_mod);
|
2015-05-19 18:17:08 +02:00
|
|
|
if (src.neg) ret = "-" + ret;
|
|
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::string FragmentProgramDecompiler::BuildCode()
|
|
|
|
|
{
|
|
|
|
|
std::stringstream OS;
|
|
|
|
|
insertHeader(OS);
|
2017-12-02 13:13:13 +01:00
|
|
|
OS << "\n";
|
2015-05-19 18:17:08 +02:00
|
|
|
insertConstants(OS);
|
2017-12-02 13:13:13 +01:00
|
|
|
OS << "\n";
|
2018-04-29 08:41:51 +02:00
|
|
|
insertInputs(OS);
|
2017-12-02 13:13:13 +01:00
|
|
|
OS << "\n";
|
2015-05-19 18:17:08 +02:00
|
|
|
insertOutputs(OS);
|
2017-12-02 13:13:13 +01:00
|
|
|
OS << "\n";
|
|
|
|
|
|
|
|
|
|
//Insert global function definitions
|
|
|
|
|
insertGlobalFunctions(OS);
|
2017-11-30 19:47:25 +01:00
|
|
|
|
2018-01-24 22:09:27 +01:00
|
|
|
//Declare register gather/merge if needed
|
|
|
|
|
if (properties.has_gather_op)
|
|
|
|
|
{
|
|
|
|
|
std::string float2 = getFloatTypeName(2);
|
|
|
|
|
std::string float4 = getFloatTypeName(4);
|
|
|
|
|
|
|
|
|
|
OS << float4 << " gather(" << float4 << " _h0, " << float4 << " _h1)\n";
|
|
|
|
|
OS << "{\n";
|
|
|
|
|
OS << " float x = uintBitsToFloat(packHalf2x16(_h0.xy));\n";
|
|
|
|
|
OS << " float y = uintBitsToFloat(packHalf2x16(_h0.zw));\n";
|
|
|
|
|
OS << " float z = uintBitsToFloat(packHalf2x16(_h1.xy));\n";
|
|
|
|
|
OS << " float w = uintBitsToFloat(packHalf2x16(_h1.zw));\n";
|
|
|
|
|
OS << " return " << float4 << "(x, y, z, w);\n";
|
|
|
|
|
OS << "}\n\n";
|
|
|
|
|
|
|
|
|
|
OS << float2 << " gather(" << float4 << " _h)\n";
|
|
|
|
|
OS << "{\n";
|
|
|
|
|
OS << " float x = uintBitsToFloat(packHalf2x16(_h.xy));\n";
|
|
|
|
|
OS << " float y = uintBitsToFloat(packHalf2x16(_h.zw));\n";
|
|
|
|
|
OS << " return " << float2 << "(x, y);\n";
|
|
|
|
|
OS << "}\n\n";
|
|
|
|
|
}
|
2017-11-30 19:47:25 +01:00
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
insertMainStart(OS);
|
|
|
|
|
OS << main << std::endl;
|
|
|
|
|
insertMainEnd(OS);
|
|
|
|
|
|
|
|
|
|
return OS.str();
|
|
|
|
|
}
|
|
|
|
|
|
2015-11-16 00:37:44 +01:00
|
|
|
// Emits the shader code for `opcode` if it is one of the operations handled
// here. Returns true when the opcode was handled, false otherwise.
bool FragmentProgramDecompiler::handle_sct(u32 opcode)
{
	// Shared shape of the SEQ/SGE/SGT/SLE/SLT/SNE results.
	const auto set_compare = [this](decltype(COMPARE::FUNCTION_SEQ) func)
	{
		SetDst(getFloatTypeName(4) + "(" + compareFunction(func, "$0", "$1") + ")");
	};

	switch (opcode)
	{
	case RSX_FP_OPCODE_ADD: SetDst("($0 + $1)"); break;
	case RSX_FP_OPCODE_DIV: SetDst("($0 / " + NotZero("$1.x") + ")"); break;

	// Note: DIVSQ is not IEEE compliant. divsq(0, 0) is 0 (Super Puzzle Fighter II Turbo HD Remix).
	// divsq(x, 0) might be equal to some big value (in absolute) whose sign is sign(x) but it has to be proven.
	case RSX_FP_OPCODE_DIVSQ: SetDst("($0 / sqrt(" + NotZeroPositive("$1.x") + "))"); break;

	case RSX_FP_OPCODE_DP2: SetDst(getFunction(FUNCTION::FUNCTION_DP2)); break;
	case RSX_FP_OPCODE_DP3: SetDst(getFunction(FUNCTION::FUNCTION_DP3)); break;
	case RSX_FP_OPCODE_DP4: SetDst(getFunction(FUNCTION::FUNCTION_DP4)); break;
	case RSX_FP_OPCODE_DP2A: SetDst(getFunction(FUNCTION::FUNCTION_DP2A)); break;
	case RSX_FP_OPCODE_MAD: SetDst("($0 * $1 + $2)"); break;
	case RSX_FP_OPCODE_MAX: SetDst("max($0, $1)"); break;
	case RSX_FP_OPCODE_MIN: SetDst("min($0, $1)"); break;
	case RSX_FP_OPCODE_MOV: SetDst("$0"); break;
	case RSX_FP_OPCODE_MUL: SetDst("($0 * $1)"); break;

	// Note: It's highly likely that RCP is not IEEE compliant but a game that uses rcp(0) has to be found
	case RSX_FP_OPCODE_RCP: SetDst("(1. / " + NotZero("$0.x") + ").xxxx"); break;

	// Note: RSQ is not IEEE compliant. rsq(0) is some big number (Silent Hill 3 HD)
	// It is not known what happens if 0 is negative.
	case RSX_FP_OPCODE_RSQ: SetDst("(1. / sqrt(" + NotZeroPositive("$0.x") + ").xxxx)"); break;

	case RSX_FP_OPCODE_SEQ: set_compare(COMPARE::FUNCTION_SEQ); break;
	case RSX_FP_OPCODE_SFL: SetDst(getFunction(FUNCTION::FUNCTION_SFL)); break;
	case RSX_FP_OPCODE_SGE: set_compare(COMPARE::FUNCTION_SGE); break;
	case RSX_FP_OPCODE_SGT: set_compare(COMPARE::FUNCTION_SGT); break;
	case RSX_FP_OPCODE_SLE: set_compare(COMPARE::FUNCTION_SLE); break;
	case RSX_FP_OPCODE_SLT: set_compare(COMPARE::FUNCTION_SLT); break;
	case RSX_FP_OPCODE_SNE: set_compare(COMPARE::FUNCTION_SNE); break;
	case RSX_FP_OPCODE_STR: SetDst(getFunction(FUNCTION::FUNCTION_STR)); break;

	default:
		// Not handled by this group.
		return false;
	}

	return true;
}
|
|
|
|
|
|
|
|
|
|
// Emits the shader code for `opcode` if it is one of the operations handled
// here. Returns true when the opcode was handled, false otherwise.
bool FragmentProgramDecompiler::handle_scb(u32 opcode)
{
	switch (opcode)
	{
	case RSX_FP_OPCODE_ADD: SetDst("($0 + $1)"); return true;
	case RSX_FP_OPCODE_COS: SetDst("cos($0.xxxx)"); return true;
	case RSX_FP_OPCODE_DIV: SetDst("($0 / " + NotZero("$1.x") + ")"); return true;

	// Note: DIVSQ is not IEEE compliant. divsq(0, 0) is 0 (Super Puzzle Fighter II Turbo HD Remix).
	// divsq(x, 0) might be equal to some big value (in absolute) whose sign is sign(x) but it has to be proven.
	case RSX_FP_OPCODE_DIVSQ: SetDst("($0 / sqrt(" + NotZeroPositive("$1.x") + "))"); return true;

	case RSX_FP_OPCODE_DP2: SetDst(getFunction(FUNCTION::FUNCTION_DP2)); return true;
	case RSX_FP_OPCODE_DP3: SetDst(getFunction(FUNCTION::FUNCTION_DP3)); return true;
	case RSX_FP_OPCODE_DP4: SetDst(getFunction(FUNCTION::FUNCTION_DP4)); return true;
	case RSX_FP_OPCODE_DP2A: SetDst(getFunction(FUNCTION::FUNCTION_DP2A)); return true;

	// The vector type name comes from getFloatTypeName(4), like every other case here,
	// instead of a hard-coded "vec4".
	// NOTE(review): the NV_fragment_program spec defines DST as
	// (1, src0.y * src1.y, src0.z, src1.w), not a Euclidean distance - confirm which
	// behaviour the hardware expects.
	case RSX_FP_OPCODE_DST: SetDst(getFloatTypeName(4) + "(distance($0, $1))"); return true;

	case RSX_FP_OPCODE_REFL: SetDst(getFunction(FUNCTION::FUNCTION_REFL)); return true;
	case RSX_FP_OPCODE_EX2: SetDst("exp2($0.xxxx)"); return true;
	case RSX_FP_OPCODE_FLR: SetDst("floor($0)"); return true;
	case RSX_FP_OPCODE_FRC: SetDst(getFunction(FUNCTION::FUNCTION_FRACT)); return true;

	case RSX_FP_OPCODE_LIT:
		SetDst("lit_legacy($0)");
		// Recorded in properties so later stages can see that lit_legacy() was used.
		properties.has_lit_op = true;
		return true;

	case RSX_FP_OPCODE_LIF: SetDst(getFloatTypeName(4) + "(1.0, $0.y, ($0.y > 0 ? pow(2.0, $0.w) : 0.0), 1.0)"); return true;
	case RSX_FP_OPCODE_LRP: SetDst(getFloatTypeName(4) + "($2 * (1 - $0) + $1 * $0)"); return true;
	case RSX_FP_OPCODE_LG2: SetDst("log2(" + NotZeroPositive("$0.x") + ").xxxx"); return true;
	case RSX_FP_OPCODE_MAD: SetDst("($0 * $1 + $2)"); return true;
	case RSX_FP_OPCODE_MAX: SetDst("max($0, $1)"); return true;
	case RSX_FP_OPCODE_MIN: SetDst("min($0, $1)"); return true;
	case RSX_FP_OPCODE_MOV: SetDst("$0"); return true;
	case RSX_FP_OPCODE_MUL: SetDst("($0 * $1)"); return true;

	// Pack operations. See https://www.khronos.org/registry/OpenGL/extensions/NV/NV_fragment_program.txt
	case RSX_FP_OPCODE_PK2: SetDst(getFloatTypeName(4) + "(uintBitsToFloat(packHalf2x16($0.xy)))"); return true;
	case RSX_FP_OPCODE_PK4: SetDst(getFloatTypeName(4) + "(uintBitsToFloat(packSnorm4x8($0)))"); return true;
	case RSX_FP_OPCODE_PK16: SetDst(getFloatTypeName(4) + "(uintBitsToFloat(packSnorm2x16($0.xy)))"); return true;

	case RSX_FP_OPCODE_PKG:
		// Should be similar to PKB but with gamma correction, see description of PK4UBG in khronos page.
		// Intentionally falls through to the PKB implementation.
	case RSX_FP_OPCODE_PKB: SetDst(getFloatTypeName(4) + "(uintBitsToFloat(packUnorm4x8($0)))"); return true;

	case RSX_FP_OPCODE_SEQ: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SEQ, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_SFL: SetDst(getFunction(FUNCTION::FUNCTION_SFL)); return true;
	case RSX_FP_OPCODE_SGE: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SGE, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_SGT: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SGT, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_SIN: SetDst("sin($0.xxxx)"); return true;
	case RSX_FP_OPCODE_SLE: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SLE, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_SLT: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SLT, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_SNE: SetDst(getFloatTypeName(4) + "(" + compareFunction(COMPARE::FUNCTION_SNE, "$0", "$1") + ")"); return true;
	case RSX_FP_OPCODE_STR: SetDst(getFunction(FUNCTION::FUNCTION_STR)); return true;
	}

	// Not handled by this group.
	return false;
}
|
|
|
|
|
|
|
|
|
|
// Handles the opcodes grouped under "tex/srb": DDX/DDY, NRM, BEM, the texture fetch
// family (TEX, TXP, TXD, TXB, TXL and the *BEM variants) and the unpack operations.
// Emits the destination assignment through SetDst() and returns true when the opcode
// was handled. Returns false for any other opcode, and for a texture fetch whose
// texture dimension matches none of the 1d/2d/cubemap/3d cases.
bool FragmentProgramDecompiler::handle_tex_srb(u32 opcode)
{
	using function_id = decltype(FUNCTION::FUNCTION_TEXTURE_SAMPLE1D);

	// TEXBEM and TXPBEM share this prologue: AddX2d() followed by the BEM expression stored into x2d
	const auto emit_bem_coords = [this]()
	{
		AddX2d();
		AddCode(Format("x2d = $0.xyxy + $1.xxxx * $2.xzxz + $1.yyyy * $2.ywyw;", true));
	};

	// TXD, TXB and TXL only differ in which sampling function is used per texture dimension.
	// The 2d case additionally records the texture unit in m_2d_sampled_textures.
	const auto emit_plain_fetch = [this](function_id fn_1d, function_id fn_2d, function_id fn_cube, function_id fn_3d) -> bool
	{
		switch (m_prog.get_texture_dimension(dst.tex_num))
		{
		case rsx::texture_dimension_extended::texture_dimension_1d:
			SetDst(getFunction(fn_1d));
			return true;
		case rsx::texture_dimension_extended::texture_dimension_2d:
			SetDst(getFunction(fn_2d));
			m_2d_sampled_textures |= (1 << dst.tex_num);
			return true;
		case rsx::texture_dimension_extended::texture_dimension_cubemap:
			SetDst(getFunction(fn_cube));
			return true;
		case rsx::texture_dimension_extended::texture_dimension_3d:
			SetDst(getFunction(fn_3d));
			return true;
		}

		return false;
	};

	switch (opcode)
	{
	case RSX_FP_OPCODE_DDX:
		SetDst(getFunction(FUNCTION::FUNCTION_DFDX));
		return true;

	case RSX_FP_OPCODE_DDY:
		SetDst(getFunction(FUNCTION::FUNCTION_DFDY));
		return true;

	case RSX_FP_OPCODE_NRM:
		SetDst("normalize($0.xyz)");
		return true;

	case RSX_FP_OPCODE_BEM:
		SetDst("$0.xyxy + $1.xxxx * $2.xzxz + $1.yyyy * $2.ywyw");
		return true;

	case RSX_FP_OPCODE_TEXBEM:
		//Untested, should be x2d followed by TEX
		emit_bem_coords();
		// fallthrough: continue as a regular TEX
	case RSX_FP_OPCODE_TEX:
	{
		switch (m_prog.get_texture_dimension(dst.tex_num))
		{
		case rsx::texture_dimension_extended::texture_dimension_1d:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLE1D));
			return true;

		case rsx::texture_dimension_extended::texture_dimension_2d:
		{
			const auto unit_bit = 1 << dst.tex_num;

			// Shadow lookups are replicated across all four components
			if (m_prog.shadow_textures & unit_bit)
			{
				m_shadow_sampled_textures |= unit_bit;
				SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SHADOW2D) + ".xxxx");
				return true;
			}

			// Redirected textures use the depth-as-RGBA sampling function
			const auto sample_fn = (m_prog.redirected_textures & unit_bit)
				? FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_DEPTH_RGBA
				: FUNCTION::FUNCTION_TEXTURE_SAMPLE2D;

			SetDst(getFunction(sample_fn));
			m_2d_sampled_textures |= unit_bit;
			return true;
		}

		case rsx::texture_dimension_extended::texture_dimension_cubemap:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE));
			return true;

		case rsx::texture_dimension_extended::texture_dimension_3d:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLE3D));
			return true;
		}

		return false;
	}

	case RSX_FP_OPCODE_TXPBEM:
		//Untested, should be x2d followed by TXP
		emit_bem_coords();
		// fallthrough: continue as a regular TXP
	case RSX_FP_OPCODE_TXP:
	{
		switch (m_prog.get_texture_dimension(dst.tex_num))
		{
		case rsx::texture_dimension_extended::texture_dimension_1d:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_PROJ));
			return true;

		case rsx::texture_dimension_extended::texture_dimension_2d:
		{
			//Note shadow comparison only returns a true/false result!
			const auto unit_bit = 1 << dst.tex_num;

			if (m_prog.shadow_textures & unit_bit)
			{
				m_shadow_sampled_textures |= unit_bit;
				SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SHADOW2D_PROJ) + ".xxxx");
			}
			else
			{
				SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_PROJ));
			}

			return true;
		}

		case rsx::texture_dimension_extended::texture_dimension_cubemap:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_PROJ));
			return true;

		case rsx::texture_dimension_extended::texture_dimension_3d:
			SetDst(getFunction(FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_PROJ));
			return true;
		}

		return false;
	}

	case RSX_FP_OPCODE_TXD:
		return emit_plain_fetch(
			FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_GRAD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_GRAD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_GRAD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_GRAD);

	case RSX_FP_OPCODE_TXB:
		return emit_plain_fetch(
			FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_BIAS,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_BIAS,
			FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_BIAS,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_BIAS);

	case RSX_FP_OPCODE_TXL:
		return emit_plain_fetch(
			FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_LOD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_LOD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_LOD,
			FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_LOD);

	//Unpack operations. See https://www.khronos.org/registry/OpenGL/extensions/NV/NV_fragment_program.txt
	case RSX_FP_OPCODE_UP2:
		SetDst("unpackHalf2x16(floatBitsToUint($0.x)).xyxy");
		return true;

	case RSX_FP_OPCODE_UP4:
		SetDst("unpackSnorm4x8(floatBitsToUint($0.x))");
		return true;

	case RSX_FP_OPCODE_UP16:
		SetDst("unpackSnorm2x16(floatBitsToUint($0.x)).xyxy");
		return true;

	case RSX_FP_OPCODE_UPG:
		//Same as UPB with gamma correction
		// fallthrough: gamma correction is not applied here, UPG is emitted exactly like UPB
	case RSX_FP_OPCODE_UPB:
		SetDst("(unpackUnorm4x8(floatBitsToUint($0.x)))");
		return true;
	}

	return false;
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
std::string FragmentProgramDecompiler::Decompile()
|
|
|
|
|
{
|
2016-01-26 20:42:54 +01:00
|
|
|
auto data = (be_t<u32>*) m_prog.addr;
|
2015-05-19 18:17:08 +02:00
|
|
|
m_size = 0;
|
|
|
|
|
m_location = 0;
|
|
|
|
|
m_loop_count = 0;
|
|
|
|
|
m_code_level = 1;
|
|
|
|
|
|
|
|
|
|
enum
|
|
|
|
|
{
|
|
|
|
|
FORCE_NONE,
|
|
|
|
|
FORCE_SCT,
|
|
|
|
|
FORCE_SCB,
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
int forced_unit = FORCE_NONE;
|
|
|
|
|
|
2018-02-25 14:07:55 +01:00
|
|
|
//Add the output registers. They are statically written to and have guaranteed initialization (except r1.z which == wpos.z)
|
|
|
|
|
//This can be used instead of an explicit clear pass in some games (Motorstorm)
|
|
|
|
|
if (m_ctrl & CELL_GCM_SHADER_CONTROL_32_BITS_EXPORTS)
|
|
|
|
|
{
|
|
|
|
|
AddReg(0, CELL_GCM_FALSE);
|
|
|
|
|
AddReg(2, CELL_GCM_FALSE);
|
|
|
|
|
AddReg(3, CELL_GCM_FALSE);
|
|
|
|
|
AddReg(4, CELL_GCM_FALSE);
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
AddReg(0, CELL_GCM_TRUE);
|
|
|
|
|
AddReg(4, CELL_GCM_TRUE);
|
|
|
|
|
AddReg(6, CELL_GCM_TRUE);
|
|
|
|
|
AddReg(8, CELL_GCM_TRUE);
|
|
|
|
|
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
while (true)
|
|
|
|
|
{
|
2016-05-13 16:01:48 +02:00
|
|
|
for (auto found = std::find(m_end_offsets.begin(), m_end_offsets.end(), m_size);
|
2018-02-25 14:07:55 +01:00
|
|
|
found != m_end_offsets.end();
|
2016-05-13 16:01:48 +02:00
|
|
|
found = std::find(m_end_offsets.begin(), m_end_offsets.end(), m_size))
|
2015-05-19 18:17:08 +02:00
|
|
|
{
|
2016-05-13 16:01:48 +02:00
|
|
|
m_end_offsets.erase(found);
|
2015-05-19 18:17:08 +02:00
|
|
|
m_code_level--;
|
|
|
|
|
AddCode("}");
|
|
|
|
|
m_loop_count--;
|
|
|
|
|
}
|
|
|
|
|
|
2016-05-13 16:01:48 +02:00
|
|
|
for (auto found = std::find(m_else_offsets.begin(), m_else_offsets.end(), m_size);
|
2018-02-25 14:07:55 +01:00
|
|
|
found != m_else_offsets.end();
|
2016-05-13 16:01:48 +02:00
|
|
|
found = std::find(m_else_offsets.begin(), m_else_offsets.end(), m_size))
|
2015-05-19 18:17:08 +02:00
|
|
|
{
|
2016-05-13 16:01:48 +02:00
|
|
|
m_else_offsets.erase(found);
|
2015-05-19 18:17:08 +02:00
|
|
|
m_code_level--;
|
|
|
|
|
AddCode("}");
|
|
|
|
|
AddCode("else");
|
|
|
|
|
AddCode("{");
|
|
|
|
|
m_code_level++;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
dst.HEX = GetData(data[0]);
|
|
|
|
|
src0.HEX = GetData(data[1]);
|
|
|
|
|
src1.HEX = GetData(data[2]);
|
|
|
|
|
src2.HEX = GetData(data[3]);
|
|
|
|
|
|
|
|
|
|
m_offset = 4 * sizeof(u32);
|
|
|
|
|
|
|
|
|
|
const u32 opcode = dst.opcode | (src1.opcode_is_branch << 6);
|
|
|
|
|
|
|
|
|
|
auto SIP = [&]()
|
|
|
|
|
{
|
|
|
|
|
switch (opcode)
|
|
|
|
|
{
|
2017-06-01 14:53:25 +02:00
|
|
|
case RSX_FP_OPCODE_BRK:
|
|
|
|
|
if (m_loop_count) AddFlowOp("break");
|
|
|
|
|
else LOG_ERROR(RSX, "BRK opcode found outside of a loop");
|
|
|
|
|
break;
|
2018-02-03 09:37:42 +01:00
|
|
|
case RSX_FP_OPCODE_CAL:
|
|
|
|
|
LOG_ERROR(RSX, "Unimplemented SIP instruction: CAL");
|
|
|
|
|
break;
|
|
|
|
|
case RSX_FP_OPCODE_FENCT:
|
|
|
|
|
AddCode("//FENCT");
|
|
|
|
|
forced_unit = FORCE_SCT;
|
|
|
|
|
break;
|
|
|
|
|
case RSX_FP_OPCODE_FENCB:
|
|
|
|
|
AddCode("//FENCB");
|
|
|
|
|
forced_unit = FORCE_SCB;
|
|
|
|
|
break;
|
2015-05-19 18:17:08 +02:00
|
|
|
case RSX_FP_OPCODE_IFE:
|
|
|
|
|
AddCode("if($cond)");
|
2015-05-22 01:56:49 +02:00
|
|
|
if (src2.end_offset != src1.else_offset)
|
|
|
|
|
m_else_offsets.push_back(src1.else_offset << 2);
|
2015-05-19 18:17:08 +02:00
|
|
|
m_end_offsets.push_back(src2.end_offset << 2);
|
|
|
|
|
AddCode("{");
|
|
|
|
|
m_code_level++;
|
|
|
|
|
break;
|
|
|
|
|
case RSX_FP_OPCODE_LOOP:
|
|
|
|
|
if (!src0.exec_if_eq && !src0.exec_if_gr && !src0.exec_if_lt)
|
|
|
|
|
{
|
2017-06-01 14:53:25 +02:00
|
|
|
AddCode(fmt::format("//$ifcond for(int i%u = %u; i%u < %u; i%u += %u) {} //-> %u //LOOP",
|
2015-05-19 18:17:08 +02:00
|
|
|
m_loop_count, src1.init_counter, m_loop_count, src1.end_counter, m_loop_count, src1.increment, src2.end_offset));
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
2015-08-12 20:38:17 +02:00
|
|
|
AddCode(fmt::format("$ifcond for(int i%u = %u; i%u < %u; i%u += %u) //LOOP",
|
2015-05-19 18:17:08 +02:00
|
|
|
m_loop_count, src1.init_counter, m_loop_count, src1.end_counter, m_loop_count, src1.increment));
|
|
|
|
|
m_loop_count++;
|
|
|
|
|
m_end_offsets.push_back(src2.end_offset << 2);
|
|
|
|
|
AddCode("{");
|
|
|
|
|
m_code_level++;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case RSX_FP_OPCODE_REP:
|
|
|
|
|
if (!src0.exec_if_eq && !src0.exec_if_gr && !src0.exec_if_lt)
|
|
|
|
|
{
|
2017-06-01 14:53:25 +02:00
|
|
|
AddCode(fmt::format("//$ifcond for(int i%u = %u; i%u < %u; i%u += %u) {} //-> %u //REP",
|
2015-05-19 18:17:08 +02:00
|
|
|
m_loop_count, src1.init_counter, m_loop_count, src1.end_counter, m_loop_count, src1.increment, src2.end_offset));
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
2015-08-12 20:38:17 +02:00
|
|
|
AddCode(fmt::format("if($cond) for(int i%u = %u; i%u < %u; i%u += %u) //REP",
|
2015-05-19 18:17:08 +02:00
|
|
|
m_loop_count, src1.init_counter, m_loop_count, src1.end_counter, m_loop_count, src1.increment));
|
|
|
|
|
m_loop_count++;
|
|
|
|
|
m_end_offsets.push_back(src2.end_offset << 2);
|
|
|
|
|
AddCode("{");
|
|
|
|
|
m_code_level++;
|
|
|
|
|
}
|
|
|
|
|
break;
|
2018-02-03 09:37:42 +01:00
|
|
|
case RSX_FP_OPCODE_RET:
|
|
|
|
|
AddFlowOp("return");
|
|
|
|
|
break;
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
switch (opcode)
|
|
|
|
|
{
|
|
|
|
|
case RSX_FP_OPCODE_NOP: break;
|
2017-05-21 21:14:59 +02:00
|
|
|
case RSX_FP_OPCODE_KIL: AddFlowOp("discard"); break;
|
2015-05-19 18:17:08 +02:00
|
|
|
|
|
|
|
|
default:
|
2016-04-02 18:18:25 +02:00
|
|
|
int prev_force_unit = forced_unit;
|
|
|
|
|
|
2017-06-30 12:59:02 +02:00
|
|
|
//Some instructions do not respect forced unit
|
|
|
|
|
//Tested with Tales of Vesperia
|
|
|
|
|
if (SIP()) break;
|
|
|
|
|
if (handle_tex_srb(opcode)) break;
|
|
|
|
|
|
2017-11-08 14:27:20 +01:00
|
|
|
//FENCT/FENCB do not actually reject instructions if they dont match the forced unit
|
2018-04-29 08:41:51 +02:00
|
|
|
//Tested with Dark Souls II where the respecting FENCX instruction will result in empty luminance averaging shaders
|
|
|
|
|
//TODO: More research is needed to determine what real HW does
|
2017-11-08 14:27:20 +01:00
|
|
|
if (handle_sct(opcode)) break;
|
|
|
|
|
if (handle_scb(opcode)) break;
|
|
|
|
|
forced_unit = FORCE_NONE;
|
2015-05-19 18:17:08 +02:00
|
|
|
|
2016-04-02 18:18:25 +02:00
|
|
|
LOG_ERROR(RSX, "Unknown/illegal instruction: 0x%x (forced unit %d)", opcode, prev_force_unit);
|
2015-05-19 18:17:08 +02:00
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
m_size += m_offset;
|
|
|
|
|
|
|
|
|
|
if (dst.end) break;
|
|
|
|
|
|
2016-08-14 21:41:01 +02:00
|
|
|
verify(HERE), m_offset % sizeof(u32) == 0;
|
2015-05-19 18:17:08 +02:00
|
|
|
data += m_offset / sizeof(u32);
|
|
|
|
|
}
|
|
|
|
|
|
2017-09-05 15:25:02 +02:00
|
|
|
while (m_code_level > 1)
|
|
|
|
|
{
|
|
|
|
|
LOG_ERROR(RSX, "Hanging block found at end of shader. Malformed shader?");
|
|
|
|
|
|
|
|
|
|
m_code_level--;
|
|
|
|
|
AddCode("}");
|
|
|
|
|
}
|
|
|
|
|
|
2015-05-19 18:17:08 +02:00
|
|
|
// flush m_code_level
|
|
|
|
|
m_code_level = 1;
|
|
|
|
|
std::string m_shader = BuildCode();
|
|
|
|
|
main.clear();
|
|
|
|
|
// m_parr.params.clear();
|
|
|
|
|
return m_shader;
|
2015-05-23 16:28:22 +02:00
|
|
|
}
|