mirror of
https://github.com/RPCSX/rpcsx.git
synced 2026-01-06 16:49:59 +01:00
- The hw generates inaccurate values when doing perspective-correct interpolation of vertex output attributes and makes the comparison (a == b) fail even when they are a fixed constant value. - Increase equality tolerance when doing comparisons in fragment shaders for NV cards only to work around this issue. - Teepo fix
234 lines
8 KiB
C++
234 lines
8 KiB
C++
#ifdef _MSC_VER
|
|
#include "stdafx.h"
|
|
#include "stdafx_d3d12.h"
|
|
#include "D3D12CommonDecompiler.h"
|
|
|
|
std::string getFloatTypeNameImp(size_t elementCount)
|
|
{
|
|
switch (elementCount)
|
|
{
|
|
default:
|
|
abort();
|
|
case 1:
|
|
return "float";
|
|
case 2:
|
|
return "float2";
|
|
case 3:
|
|
return "float3";
|
|
case 4:
|
|
return "float4";
|
|
}
|
|
}
|
|
|
|
std::string getFunctionImp(FUNCTION f)
|
|
{
|
|
switch (f)
|
|
{
|
|
default:
|
|
fmt::throw_exception("Unsupported program function %d", (u32)f);
|
|
case FUNCTION::FUNCTION_DP2:
|
|
return "dot($0.xy, $1.xy).xxxx";
|
|
case FUNCTION::FUNCTION_DP2A:
|
|
return "(dot($0.xy, $1.xy) + $2.x).xxxx";
|
|
case FUNCTION::FUNCTION_DP3:
|
|
return "dot($0.xyz, $1.xyz).xxxx";
|
|
case FUNCTION::FUNCTION_DP4:
|
|
return "dot($0, $1).xxxx";
|
|
case FUNCTION::FUNCTION_DPH:
|
|
return "dot(float4($0.xyz, 1.0), $1).xxxx";
|
|
case FUNCTION::FUNCTION_SFL:
|
|
return "float4(0., 0., 0., 0.)";
|
|
case FUNCTION::FUNCTION_STR:
|
|
return "float4(1., 1., 1., 1.)";
|
|
case FUNCTION::FUNCTION_FRACT:
|
|
return "frac($0)";
|
|
case FUNCTION::FUNCTION_REFL:
|
|
return "($0 - 2.0 * (dot($0, $1)) * $1)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE1D:
|
|
return "$t.Sample($tsampler, $0.x)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_PROJ:
|
|
return "$t.Sample($tsampler, ($0.x / $0.w))";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_BIAS:
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_LOD:
|
|
return "$t.SampleLevel($tsampler, $0.x, $1)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE1D_GRAD:
|
|
return "$t.SampleGrad($tsampler, $0.x, $1, $2)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SHADOW2D: //TODO
|
|
case FUNCTION::FUNCTION_TEXTURE_SHADOW2D_PROJ:
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D:
|
|
return "$t.Sample($tsampler, $0.xy * $t_scale)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_PROJ:
|
|
return "$t.Sample($tsampler, ($0.xy / $0.w) * $t_scale)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_BIAS:
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_LOD:
|
|
return "$t.SampleLevel($tsampler, $0.xy * $t_scale, $1)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_GRAD:
|
|
return "$t.SampleGrad($tsampler, $0.xy, $1, $2)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE:
|
|
return "$t.Sample($tsampler, $0.xyz)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_PROJ:
|
|
return "$t.Sample($tsampler, ($0.xyz / $0.w))";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_BIAS:
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_LOD:
|
|
return "$t.SampleLevel($tsampler, $0.xyz, $1)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLECUBE_GRAD:
|
|
return "$t.SampleGrad($tsampler, $0.xyz, $1, $2)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE3D:
|
|
return "$t.Sample($tsampler, $0.xyz)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_PROJ:
|
|
return "$t.Sample($tsampler, ($0.xyz / $0.w))";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_BIAS:
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_LOD:
|
|
return "$t.SampleLevel($tsampler, $0.xyz, $1)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE3D_GRAD:
|
|
return "$t.SampleGrad($tsampler, $0.xyz, $1, $2)";
|
|
case FUNCTION::FUNCTION_DFDX:
|
|
return "ddx($0)";
|
|
case FUNCTION::FUNCTION_DFDY:
|
|
return "ddy($0)";
|
|
case FUNCTION::FUNCTION_TEXTURE_SAMPLE2D_DEPTH_RGBA:
|
|
return "texture2DReconstruct($t.Sample($tsampler, $0.xy * $t_scale), texture_parameters[$_i].z)";
|
|
}
|
|
}
|
|
|
|
std::string compareFunctionImp(COMPARE f, const std::string &Op0, const std::string &Op1)
|
|
{
|
|
switch (f)
|
|
{
|
|
default:
|
|
abort();
|
|
case COMPARE::FUNCTION_SEQ:
|
|
return "(" + Op0 + " == " + Op1 + ")";
|
|
case COMPARE::FUNCTION_SGE:
|
|
return "(" + Op0 + " >= " + Op1 + ")";
|
|
case COMPARE::FUNCTION_SGT:
|
|
return "(" + Op0 + " > " + Op1 + ")";
|
|
case COMPARE::FUNCTION_SLE:
|
|
return "(" + Op0 + " <= " + Op1 + ")";
|
|
case COMPARE::FUNCTION_SLT:
|
|
return "(" + Op0 + " < " + Op1 + ")";
|
|
case COMPARE::FUNCTION_SNE:
|
|
return "(" + Op0 + " != " + Op1 + ")";
|
|
}
|
|
}
|
|
|
|
void insert_d3d12_legacy_function(std::ostream& OS, bool is_fragment_program)
|
|
{
|
|
OS << "#define _select lerp\n\n";
|
|
|
|
OS << "float4 lit_legacy(float4 val)";
|
|
OS << "{\n";
|
|
OS << " float4 clamped_val = val;\n";
|
|
OS << " clamped_val.x = max(val.x, 0);\n";
|
|
OS << " clamped_val.y = max(val.y, 0);\n";
|
|
OS << " float4 result;\n";
|
|
OS << " result.x = 1.0;\n";
|
|
OS << " result.w = 1.;\n";
|
|
OS << " result.y = clamped_val.x;\n";
|
|
OS << " result.z = clamped_val.x > 0.0 ? exp(clamped_val.w * log(max(clamped_val.y, 1.E-10))) : 0.0;\n";
|
|
OS << " return result;\n";
|
|
OS << "}\n\n";
|
|
|
|
if (!is_fragment_program)
|
|
return;
|
|
|
|
program_common::insert_compare_op(OS, false);
|
|
|
|
OS << "uint packSnorm2x16(float2 val)";
|
|
OS << "{\n";
|
|
OS << " uint high_bits = round(clamp(val.x, -1., 1.) * 32767.);\n";
|
|
OS << " uint low_bits = round(clamp(val.y, -1., 1.) * 32767.);\n";
|
|
OS << " return (high_bits << 16)|low_bits;\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "uint packSnorm4x8(float4 val)";
|
|
OS << "{\n";
|
|
OS << " uint high_bits_a = round(clamp(val.x, -1., 1.) * 127.);\n";
|
|
OS << " uint high_bits_b = round(clamp(val.y, -1., 1.) * 127.);\n";
|
|
OS << " uint low_bits_a = round(clamp(val.z, -1., 1.) * 127.);\n";
|
|
OS << " uint low_bits_b = round(clamp(val.z, -1., 1.) * 127.);\n";
|
|
OS << " return (high_bits_a << 24)|(high_bits_b << 16)|(low_bits_a << 8)|low_bits_b;\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float2 unpackSnorm2x16(uint val)";
|
|
OS << "{\n";
|
|
OS << " float high = clamp((val >> 16) / 32767., -1., 1.);\n";
|
|
OS << " float low = clamp((val & 0x0000FFFF) / 32767., -1., 1.);\n";
|
|
OS << " return float2(high, low);\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float4 unpackSnorm4x8(uint val)";
|
|
OS << "{\n";
|
|
OS << " float high_a = clamp((val >> 24) / 127., -1., 1.);\n";
|
|
OS << " float high_b = clamp(((val >> 16) & 0xFF) / 127., -1., 1.);\n";
|
|
OS << " float low_a = clamp(((val >> 8) & 0xFF) / 127., -1., 1.);\n";
|
|
OS << " float low_b = clamp((val & 0xFF) / 127., -1., 1.);\n";
|
|
OS << " return float4(high_a, high_b, low_a, low_b);\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "uint packUnorm4x8(float4 val)";
|
|
OS << "{\n";
|
|
OS << " uint high_bits_a = round(clamp(val.x, -1., 1.) * 255.);\n";
|
|
OS << " uint high_bits_b = round(clamp(val.y, -1., 1.) * 255.);\n";
|
|
OS << " uint low_bits_a = round(clamp(val.z, -1., 1.) * 255.);\n";
|
|
OS << " uint low_bits_b = round(clamp(val.z, -1., 1.) * 255.);\n";
|
|
OS << " return (high_bits_a << 24)|(high_bits_b << 16)|(low_bits_a << 8)|low_bits_b;\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float4 unpackUnorm4x8(uint val)";
|
|
OS << "{\n";
|
|
OS << " float high_a = clamp((val >> 24) / 255., -1., 1.);\n";
|
|
OS << " float high_b = clamp(((val >> 16) & 0xFF) / 255., -1., 1.);\n";
|
|
OS << " float low_a = clamp(((val >> 8) & 0xFF) / 255., -1., 1.);\n";
|
|
OS << " float low_b = clamp((val & 0xFF) / 255., -1., 1.);\n";
|
|
OS << " return float4(high_a, high_b, low_a, low_b);\n";
|
|
OS << "}\n\n";
|
|
|
|
/**
|
|
* There is no easy way to do this in a shader since we cant recast the f16 blocks to u16
|
|
* Fake it and hope the program requests the corresponding f16 unpack
|
|
**/
|
|
OS << "uint packHalf2x16(float2 val)";
|
|
OS << "{\n";
|
|
OS << " return packSnorm2x16(val / 65504.);\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float2 unpackHalf2x16(uint val)";
|
|
OS << "{\n";
|
|
OS << " return unpackSnorm2x16(val) * 65504.;\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float read_value(float4 src, uint remap_index)\n";
|
|
OS << "{\n";
|
|
OS << " switch (remap_index)\n";
|
|
OS << " {\n";
|
|
OS << " case 0: return src.a;\n";
|
|
OS << " case 1: return src.r;\n";
|
|
OS << " case 2: return src.g;\n";
|
|
OS << " case 3: return src.b;\n";
|
|
OS << " }\n";
|
|
OS << "}\n\n";
|
|
|
|
OS << "float4 texture2DReconstruct(float depth_value, float remap)\n";
|
|
OS << "{\n";
|
|
OS << " uint value = round(depth_value * 16777215);\n";
|
|
OS << " uint b = (value & 0xff);\n";
|
|
OS << " uint g = (value >> 8) & 0xff;\n";
|
|
OS << " uint r = (value >> 16) & 0xff;\n";
|
|
OS << " float4 result = float4(g/255., b/255., 1., r/255.);\n\n";
|
|
OS << " uint remap_vector = asuint(remap) & 0xFF;\n";
|
|
OS << " if (remap_vector == 0xE4) return result;\n\n";
|
|
OS << " float4 tmp;\n";
|
|
OS << " uint remap_a = remap_vector & 0x3;\n";
|
|
OS << " uint remap_r = (remap_vector >> 2) & 0x3;\n";
|
|
OS << " uint remap_g = (remap_vector >> 4) & 0x3;\n";
|
|
OS << " uint remap_b = (remap_vector >> 6) & 0x3;\n";
|
|
OS << " tmp.a = read_value(result, remap_a);\n";
|
|
OS << " tmp.r = read_value(result, remap_r);\n";
|
|
OS << " tmp.g = read_value(result, remap_g);\n";
|
|
OS << " tmp.b = read_value(result, remap_b);\n";
|
|
OS << " return tmp;\n";
|
|
OS << "}\n\n";
|
|
}
|
|
#endif
|