2012-11-15 00:39:56 +01:00
# include "stdafx.h"
2014-06-02 19:27:24 +02:00
# include "Emu/Memory/Memory.h"
2017-05-20 13:45:02 +02:00
# include "Emu/System.h"
2015-10-26 22:09:31 +01:00
# include "GLGSRender.h"
2016-10-18 09:57:28 +02:00
# include "GLVertexProgram.h"
2016-01-05 22:29:49 +01:00
# include "../rsx_methods.h"
2016-01-12 00:54:07 +01:00
# include "../Common/BufferUtils.h"
2016-06-20 23:38:38 +02:00
# include "../rsx_utils.h"
2012-11-15 00:39:56 +01:00
2013-08-27 17:18:01 +02:00
# define DUMP_VERTEX_DATA 0
2012-11-15 00:39:56 +01:00
2016-01-13 17:40:10 +01:00
namespace
{
2016-01-20 18:12:48 +01:00
u32 get_max_depth_value ( rsx : : surface_depth_format format )
2016-01-13 17:40:10 +01:00
{
switch ( format )
{
2016-01-20 18:12:48 +01:00
case rsx : : surface_depth_format : : z16 : return 0xFFFF ;
case rsx : : surface_depth_format : : z24s8 : return 0xFFFFFF ;
2016-01-13 17:40:10 +01:00
}
2016-08-08 18:01:06 +02:00
fmt : : throw_exception ( " Unknown depth format " HERE ) ;
2016-06-30 06:46:25 +02:00
}
2016-01-13 17:40:10 +01:00
}
2017-05-20 13:45:02 +02:00
/// Constructs the OpenGL renderer: creates the shader cache, selects the
/// vertex cache implementation from the configuration and records which
/// optional features (multidraw, native UI) are available.
GLGSRender::GLGSRender() : GSRender()
{
	m_shaders_cache.reset(new gl::shader_cache(m_prog_buffer, " opengl ", " v1.1 "));

	// The weak vertex cache is the default; the null cache is used only when
	// the user disabled vertex caching in the configuration.
	if (!g_cfg.video.disable_vertex_cache)
	{
		m_vertex_cache.reset(new gl::weak_vertex_cache());
	}
	else
	{
		m_vertex_cache.reset(new gl::null_vertex_cache());
	}

	// Multidraw is turned off when strict rendering mode is requested
	supports_multidraw = !g_cfg.video.strict_rendering_mode;
	supports_native_ui = static_cast<bool>(g_cfg.misc.use_native_interface);
}
2014-08-23 02:16:54 +02:00
2015-10-11 22:00:51 +02:00
extern CellGcmContextData current_context ;
2016-06-26 23:37:02 +02:00
namespace
{
2016-07-19 13:06:01 +02:00
/// Maps an RSX comparison function onto the equivalent OpenGL comparison enum.
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum comparison_op(rsx::comparison_function op)
{
	using func = rsx::comparison_function;

	switch (op)
	{
	case func::never:
		return GL_NEVER;
	case func::less:
		return GL_LESS;
	case func::equal:
		return GL_EQUAL;
	case func::less_or_equal:
		return GL_LEQUAL;
	case func::greater:
		return GL_GREATER;
	case func::not_equal:
		return GL_NOTEQUAL;
	case func::greater_or_equal:
		return GL_GEQUAL;
	case func::always:
		return GL_ALWAYS;
	default:
		break;
	}

	fmt::throw_exception(" Unsupported comparison op 0x%X " HERE, static_cast<u32>(op));
}
/// Maps an RSX stencil operation onto the equivalent OpenGL stencil op enum.
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum stencil_op(rsx::stencil_op op)
{
	using rsx_op = rsx::stencil_op;

	switch (op)
	{
	case rsx_op::keep:
		return GL_KEEP;
	case rsx_op::zero:
		return GL_ZERO;
	case rsx_op::replace:
		return GL_REPLACE;
	case rsx_op::invert:
		return GL_INVERT;
	case rsx_op::incr:
		return GL_INCR;
	case rsx_op::decr:
		return GL_DECR;
	case rsx_op::incr_wrap:
		return GL_INCR_WRAP;
	case rsx_op::decr_wrap:
		return GL_DECR_WRAP;
	default:
		break;
	}

	fmt::throw_exception(" Unsupported stencil op 0x%X " HERE, static_cast<u32>(op));
}
/// Maps an RSX blend equation onto an OpenGL blend equation enum.
/// The signed add / reverse-subtract variants are emulated with their
/// unsigned counterparts (a trace message is logged). Anything else that is
/// not handled logs an error and falls back to GL_FUNC_ADD.
GLenum blend_equation(rsx::blend_equation op)
{
	using eq = rsx::blend_equation;

	switch (op)
	{
	case eq::add:
		return GL_FUNC_ADD;

	case eq::add_signed:
		// Note : maybe add is signed on gl
		LOG_TRACE(RSX, " blend equation add_signed used. Emulating using FUNC_ADD ");
		return GL_FUNC_ADD;

	case eq::min:
		return GL_MIN;

	case eq::max:
		return GL_MAX;

	case eq::substract:
		return GL_FUNC_SUBTRACT;

	case eq::reverse_substract:
		return GL_FUNC_REVERSE_SUBTRACT;

	case eq::reverse_substract_signed:
		LOG_TRACE(RSX, " blend equation reverse_subtract_signed used. Emulating using FUNC_REVERSE_SUBTRACT ");
		return GL_FUNC_REVERSE_SUBTRACT;

	case eq::reverse_add_signed:
	default:
		break;
	}

	// Unimplemented (reverse_add_signed) or unknown equation
	LOG_ERROR(RSX, " Blend equation 0x%X is unimplemented! ", static_cast<u32>(op));
	return GL_FUNC_ADD;
}
/// Maps an RSX blend factor onto the equivalent OpenGL blend factor enum.
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum blend_factor(rsx::blend_factor op)
{
	using factor = rsx::blend_factor;

	switch (op)
	{
	// Constant factors
	case factor::zero:
		return GL_ZERO;
	case factor::one:
		return GL_ONE;

	// Source / destination colour
	case factor::src_color:
		return GL_SRC_COLOR;
	case factor::one_minus_src_color:
		return GL_ONE_MINUS_SRC_COLOR;
	case factor::dst_color:
		return GL_DST_COLOR;
	case factor::one_minus_dst_color:
		return GL_ONE_MINUS_DST_COLOR;

	// Source / destination alpha
	case factor::src_alpha:
		return GL_SRC_ALPHA;
	case factor::one_minus_src_alpha:
		return GL_ONE_MINUS_SRC_ALPHA;
	case factor::dst_alpha:
		return GL_DST_ALPHA;
	case factor::one_minus_dst_alpha:
		return GL_ONE_MINUS_DST_ALPHA;
	case factor::src_alpha_saturate:
		return GL_SRC_ALPHA_SATURATE;

	// Blend constant
	case factor::constant_color:
		return GL_CONSTANT_COLOR;
	case factor::one_minus_constant_color:
		return GL_ONE_MINUS_CONSTANT_COLOR;
	case factor::constant_alpha:
		return GL_CONSTANT_ALPHA;
	case factor::one_minus_constant_alpha:
		return GL_ONE_MINUS_CONSTANT_ALPHA;

	default:
		break;
	}

	fmt::throw_exception(" Unsupported blend factor 0x%X " HERE, static_cast<u32>(op));
}
/// Maps an RSX framebuffer logic operation onto the equivalent OpenGL logic op enum.
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum logic_op(rsx::logic_op op)
{
	using lop = rsx::logic_op;

	switch (op)
	{
	case lop::logic_clear:
		return GL_CLEAR;
	case lop::logic_and:
		return GL_AND;
	case lop::logic_and_reverse:
		return GL_AND_REVERSE;
	case lop::logic_copy:
		return GL_COPY;
	case lop::logic_and_inverted:
		return GL_AND_INVERTED;
	case lop::logic_noop:
		return GL_NOOP;
	case lop::logic_xor:
		return GL_XOR;
	case lop::logic_or:
		return GL_OR;
	case lop::logic_nor:
		return GL_NOR;
	case lop::logic_equiv:
		return GL_EQUIV;
	case lop::logic_invert:
		return GL_INVERT;
	case lop::logic_or_reverse:
		return GL_OR_REVERSE;
	case lop::logic_copy_inverted:
		return GL_COPY_INVERTED;
	case lop::logic_or_inverted:
		return GL_OR_INVERTED;
	case lop::logic_nand:
		return GL_NAND;
	case lop::logic_set:
		return GL_SET;
	default:
		break;
	}

	fmt::throw_exception(" Unsupported logic op 0x%X " HERE, static_cast<u32>(op));
}
/// Maps an RSX front-face winding onto the OpenGL winding enum.
/// The winding is deliberately swapped (cw -> GL_CCW, ccw -> GL_CW).
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum front_face(rsx::front_face op)
{
	//NOTE: RSX face winding is always based off of upper-left corner like vulkan, but GL is bottom left
	//shader_window_origin register does not affect this
	//verified with Outrun Online Arcade (window_origin::top) and DS2 (window_origin::bottom)
	//correctness of face winding checked using stencil test (GOW collection shadows)
	if (op == rsx::front_face::cw)
		return GL_CCW;

	if (op == rsx::front_face::ccw)
		return GL_CW;

	fmt::throw_exception(" Unsupported front face 0x%X " HERE, static_cast<u32>(op));
}
/// Maps an RSX cull-face selection onto the equivalent OpenGL face enum.
/// Values that match no enumerator are reported through fmt::throw_exception.
GLenum cull_face(rsx::cull_face op)
{
	if (op == rsx::cull_face::front)
		return GL_FRONT;

	if (op == rsx::cull_face::back)
		return GL_BACK;

	if (op == rsx::cull_face::front_and_back)
		return GL_FRONT_AND_BACK;

	fmt::throw_exception(" Unsupported cull face 0x%X " HERE, static_cast<u32>(op));
}
}
2015-10-11 22:00:51 +02:00
void GLGSRender : : begin ( )
2015-10-04 00:45:26 +02:00
{
2015-10-11 22:00:51 +02:00
rsx : : thread : : begin ( ) ;
2017-12-02 13:15:03 +01:00
if ( skip_frame | |
( conditional_render_enabled & & conditional_render_test_failed ) )
2017-07-27 18:04:55 +02:00
return ;
2017-11-15 16:50:41 +01:00
init_buffers ( rsx : : framebuffer_creation_context : : context_draw ) ;
2015-01-31 14:01:34 +01:00
}
2015-10-11 22:00:51 +02:00
void GLGSRender : : end ( )
{
2017-10-29 17:34:55 +01:00
std : : chrono : : time_point < steady_clock > state_check_start = steady_clock : : now ( ) ;
2017-12-02 13:15:03 +01:00
if ( skip_frame | | ! framebuffer_status_valid | |
( conditional_render_enabled & & conditional_render_test_failed ) | |
! check_program_state ( ) )
2015-10-11 22:00:51 +02:00
{
rsx : : thread : : end ( ) ;
return ;
}
2015-10-09 20:04:20 +02:00
2017-10-29 17:34:55 +01:00
std : : chrono : : time_point < steady_clock > state_check_end = steady_clock : : now ( ) ;
m_begin_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( state_check_end - state_check_start ) . count ( ) ;
2016-10-18 09:57:28 +02:00
if ( manually_flush_ring_buffers )
{
//Use approximations to reseve space. This path is mostly for debug purposes anyway
u32 approx_vertex_count = rsx : : method_registers . current_draw_clause . get_elements_count ( ) ;
u32 approx_working_buffer_size = approx_vertex_count * 256 ;
//Allocate 256K heap if we have no approximation at this time (inlined array)
m_attrib_ring_buffer - > reserve_storage_on_heap ( std : : max ( approx_working_buffer_size , 256 * 1024U ) ) ;
m_index_ring_buffer - > reserve_storage_on_heap ( 16 * 1024 ) ;
}
2017-07-31 13:38:28 +02:00
//Do vertex upload before RTT prep / texture lookups to give the driver time to push data
2018-01-21 16:31:35 +01:00
auto upload_info = set_vertex_buffer ( ) ;
2017-07-31 13:38:28 +02:00
2017-10-30 13:27:22 +01:00
//Load textures
{
std : : chrono : : time_point < steady_clock > textures_start = steady_clock : : now ( ) ;
2017-10-31 14:54:55 +01:00
std : : lock_guard < std : : mutex > lock ( m_sampler_mutex ) ;
2017-10-30 13:27:22 +01:00
void * unused = nullptr ;
2017-10-31 19:49:30 +01:00
bool update_framebuffer_sourced = false ;
2017-10-31 14:54:55 +01:00
2017-10-31 16:45:54 +01:00
if ( surface_store_tag ! = m_rtts . cache_tag )
{
2017-10-31 19:49:30 +01:00
update_framebuffer_sourced = true ;
2017-10-31 16:45:54 +01:00
surface_store_tag = m_rtts . cache_tag ;
}
2017-10-31 14:54:55 +01:00
for ( int i = 0 ; i < rsx : : limits : : fragment_textures_count ; + + i )
{
2017-10-31 19:49:30 +01:00
if ( ! fs_sampler_state [ i ] )
fs_sampler_state [ i ] = std : : make_unique < gl : : texture_cache : : sampled_image_descriptor > ( ) ;
2017-10-31 14:54:55 +01:00
2017-10-31 19:49:30 +01:00
if ( m_samplers_dirty | | m_textures_dirty [ i ] | |
( update_framebuffer_sourced & & fs_sampler_state [ i ] - > upload_context = = rsx : : texture_upload_context : : framebuffer_storage ) )
{
2017-10-31 14:54:55 +01:00
auto sampler_state = static_cast < gl : : texture_cache : : sampled_image_descriptor * > ( fs_sampler_state [ i ] . get ( ) ) ;
if ( rsx : : method_registers . fragment_textures [ i ] . enabled ( ) )
{
* sampler_state = m_gl_texture_cache . upload_texture ( unused , rsx : : method_registers . fragment_textures [ i ] , m_rtts ) ;
2017-11-03 19:09:29 +01:00
if ( m_textures_dirty [ i ] )
2017-12-09 10:21:44 +01:00
m_gl_sampler_states [ i ] . apply ( rsx : : method_registers . fragment_textures [ i ] , fs_sampler_state [ i ] . get ( ) ) ;
2017-10-31 14:54:55 +01:00
}
else
{
2017-10-30 13:27:22 +01:00
* sampler_state = { } ;
}
2017-10-31 14:54:55 +01:00
m_textures_dirty [ i ] = false ;
}
}
for ( int i = 0 ; i < rsx : : limits : : vertex_textures_count ; + + i )
{
2017-10-31 19:49:30 +01:00
if ( ! vs_sampler_state [ i ] )
vs_sampler_state [ i ] = std : : make_unique < gl : : texture_cache : : sampled_image_descriptor > ( ) ;
2017-10-31 14:54:55 +01:00
2017-10-31 19:49:30 +01:00
if ( m_samplers_dirty | | m_vertex_textures_dirty [ i ] | |
( update_framebuffer_sourced & & vs_sampler_state [ i ] - > upload_context = = rsx : : texture_upload_context : : framebuffer_storage ) )
2017-10-31 14:54:55 +01:00
{
auto sampler_state = static_cast < gl : : texture_cache : : sampled_image_descriptor * > ( vs_sampler_state [ i ] . get ( ) ) ;
if ( rsx : : method_registers . vertex_textures [ i ] . enabled ( ) )
{
* sampler_state = m_gl_texture_cache . upload_texture ( unused , rsx : : method_registers . vertex_textures [ i ] , m_rtts ) ;
}
else
* sampler_state = { } ;
m_vertex_textures_dirty [ i ] = false ;
}
}
2017-10-30 13:27:22 +01:00
m_samplers_dirty . store ( false ) ;
std : : chrono : : time_point < steady_clock > textures_end = steady_clock : : now ( ) ;
m_textures_upload_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( textures_end - textures_start ) . count ( ) ;
}
2017-07-31 13:38:28 +02:00
std : : chrono : : time_point < steady_clock > program_start = steady_clock : : now ( ) ;
//Load program here since it is dependent on vertex state
2018-01-21 16:31:35 +01:00
load_program ( upload_info ) ;
2017-07-31 13:38:28 +02:00
std : : chrono : : time_point < steady_clock > program_stop = steady_clock : : now ( ) ;
m_begin_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( program_stop - program_start ) . count ( ) ;
if ( manually_flush_ring_buffers )
{
m_attrib_ring_buffer - > unmap ( ) ;
m_index_ring_buffer - > unmap ( ) ;
}
else
{
//DMA push; not needed with MAP_COHERENT
//glMemoryBarrier(GL_CLIENT_MAPPED_BUFFER_BARRIER_BIT);
}
2017-11-01 13:34:38 +01:00
//Bind textures and resolve external copy operations
std : : chrono : : time_point < steady_clock > textures_start = steady_clock : : now ( ) ;
int unused_location ;
for ( int i = 0 ; i < rsx : : limits : : fragment_textures_count ; + + i )
{
if ( m_program - > uniforms . has_location ( " tex " + std : : to_string ( i ) , & unused_location ) )
{
auto sampler_state = static_cast < gl : : texture_cache : : sampled_image_descriptor * > ( fs_sampler_state [ i ] . get ( ) ) ;
auto & tex = rsx : : method_registers . fragment_textures [ i ] ;
glActiveTexture ( GL_TEXTURE0 + i ) ;
2017-11-01 14:38:37 +01:00
if ( tex . enabled ( ) )
2017-11-01 13:34:38 +01:00
{
2018-01-31 17:11:03 +01:00
GLenum target = gl : : get_target ( sampler_state - > image_type ) ;
2017-11-01 14:38:37 +01:00
if ( sampler_state - > image_handle )
{
glBindTexture ( target , sampler_state - > image_handle ) ;
}
else if ( sampler_state - > external_subresource_desc . external_handle )
{
2017-11-03 12:16:55 +01:00
void * unused = nullptr ;
glBindTexture ( target , m_gl_texture_cache . create_temporary_subresource ( unused , sampler_state - > external_subresource_desc ) ) ;
2017-11-01 14:38:37 +01:00
}
else
{
2018-02-02 13:25:15 +01:00
glBindTexture ( target , m_null_textures [ target ] - > id ( ) ) ;
2017-11-01 14:38:37 +01:00
}
2017-11-01 13:34:38 +01:00
}
else
{
2018-02-02 13:25:15 +01:00
glBindTexture ( GL_TEXTURE_1D , m_null_textures [ GL_TEXTURE_1D ] - > id ( ) ) ;
glBindTexture ( GL_TEXTURE_2D , m_null_textures [ GL_TEXTURE_2D ] - > id ( ) ) ;
glBindTexture ( GL_TEXTURE_3D , m_null_textures [ GL_TEXTURE_3D ] - > id ( ) ) ;
glBindTexture ( GL_TEXTURE_CUBE_MAP , m_null_textures [ GL_TEXTURE_CUBE_MAP ] - > id ( ) ) ;
2017-11-01 13:34:38 +01:00
}
}
}
for ( int i = 0 ; i < rsx : : limits : : vertex_textures_count ; + + i )
{
if ( m_program - > uniforms . has_location ( " vtex " + std : : to_string ( i ) , & unused_location ) )
{
auto sampler_state = static_cast < gl : : texture_cache : : sampled_image_descriptor * > ( vs_sampler_state [ i ] . get ( ) ) ;
glActiveTexture ( GL_TEXTURE0 + rsx : : limits : : fragment_textures_count + i ) ;
if ( sampler_state - > image_handle )
{
glBindTexture ( GL_TEXTURE_2D , sampler_state - > image_handle ) ;
}
else if ( sampler_state - > external_subresource_desc . external_handle )
{
2017-11-03 12:16:55 +01:00
void * unused = nullptr ;
glBindTexture ( GL_TEXTURE_2D , m_gl_texture_cache . create_temporary_subresource ( unused , sampler_state - > external_subresource_desc ) ) ;
2017-11-01 13:34:38 +01:00
}
else
{
glBindTexture ( GL_TEXTURE_2D , GL_NONE ) ;
}
}
}
std : : chrono : : time_point < steady_clock > textures_end = steady_clock : : now ( ) ;
m_textures_upload_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( textures_end - textures_start ) . count ( ) ;
2017-11-01 14:38:37 +01:00
update_draw_state ( ) ;
2016-07-22 01:31:58 +02:00
//Check if depth buffer is bound and valid
//If ds is not initialized clear it; it seems new depth textures should have depth cleared
2017-06-30 23:24:41 +02:00
auto copy_rtt_contents = [ ] ( gl : : render_target * surface )
{
2017-10-23 14:54:29 +02:00
if ( surface - > get_compatible_internal_format ( ) = = surface - > old_contents - > get_compatible_internal_format ( ) )
{
//Copy data from old contents onto this one
//1. Clip a rectangular region defning the data
//2. Perform a GPU blit
u16 parent_w = surface - > old_contents - > width ( ) ;
u16 parent_h = surface - > old_contents - > height ( ) ;
u16 copy_w , copy_h ;
std : : tie ( std : : ignore , std : : ignore , copy_w , copy_h ) = rsx : : clip_region < u16 > ( parent_w , parent_h , 0 , 0 , surface - > width ( ) , surface - > height ( ) , true ) ;
glCopyImageSubData ( surface - > old_contents - > id ( ) , GL_TEXTURE_2D , 0 , 0 , 0 , 0 , surface - > id ( ) , GL_TEXTURE_2D , 0 , 0 , 0 , 0 , copy_w , copy_h , 1 ) ;
surface - > set_cleared ( ) ;
}
//TODO: download image contents and reupload them or do a memory cast to copy memory contents if not compatible
2017-06-30 23:24:41 +02:00
surface - > old_contents = nullptr ;
} ;
2017-07-18 12:44:36 +02:00
//Check if we have any 'recycled' surfaces in memory and if so, clear them
std : : vector < int > buffers_to_clear ;
bool clear_all_color = true ;
bool clear_depth = false ;
for ( int index = 0 ; index < 4 ; index + + )
{
if ( std : : get < 0 > ( m_rtts . m_bound_render_targets [ index ] ) ! = 0 )
{
if ( std : : get < 1 > ( m_rtts . m_bound_render_targets [ index ] ) - > cleared ( ) )
clear_all_color = false ;
else
buffers_to_clear . push_back ( index ) ;
}
}
2016-07-22 01:31:58 +02:00
gl : : render_target * ds = std : : get < 1 > ( m_rtts . m_bound_depth_stencil ) ;
if ( ds & & ! ds - > cleared ( ) )
{
2017-07-18 12:44:36 +02:00
clear_depth = true ;
}
//Temporarily disable pixel tests
glDisable ( GL_SCISSOR_TEST ) ;
if ( clear_depth | | buffers_to_clear . size ( ) > 0 )
{
GLenum mask = 0 ;
if ( clear_depth )
{
2017-08-07 18:35:16 +02:00
gl_state . depth_mask ( GL_TRUE ) ;
gl_state . clear_depth ( 1.0 ) ;
gl_state . clear_stencil ( 255 ) ;
2017-07-18 12:44:36 +02:00
mask | = GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT ;
}
if ( clear_all_color )
mask | = GL_COLOR_BUFFER_BIT ;
2016-08-26 16:23:23 +02:00
2017-07-18 12:44:36 +02:00
glClear ( mask ) ;
2017-06-30 23:24:41 +02:00
2017-07-18 12:44:36 +02:00
if ( buffers_to_clear . size ( ) > 0 & & ! clear_all_color )
2017-06-30 23:24:41 +02:00
{
2017-07-18 12:44:36 +02:00
GLfloat colors [ ] = { 0.f , 0.f , 0.f , 0.f } ;
//It is impossible for the render target to be typa A or B here (clear all would have been flagged)
for ( auto & i : buffers_to_clear )
glClearBufferfv ( draw_fbo . id ( ) , i , colors ) ;
2017-06-30 23:24:41 +02:00
}
2017-07-18 12:44:36 +02:00
if ( clear_depth )
2017-08-07 18:35:16 +02:00
gl_state . depth_mask ( rsx : : method_registers . depth_write_enabled ( ) ) ;
2016-07-22 01:31:58 +02:00
ds - > set_cleared ( ) ;
}
2017-11-15 13:02:59 +01:00
if ( ds & & ds - > old_contents ! = nullptr & & ds - > get_rsx_pitch ( ) = = ds - > old_contents - > get_rsx_pitch ( ) & &
ds - > old_contents - > get_compatible_internal_format ( ) = = gl : : texture : : internal_format : : rgba8 )
{
m_depth_converter . run ( ds - > width ( ) , ds - > height ( ) , ds - > id ( ) , ds - > old_contents - > id ( ) ) ;
ds - > old_contents = nullptr ;
}
2017-06-30 23:24:41 +02:00
if ( g_cfg . video . strict_rendering_mode )
{
2017-11-22 16:45:26 +01:00
if ( ds & & ds - > old_contents ! = nullptr )
2017-07-18 12:44:36 +02:00
copy_rtt_contents ( ds ) ;
2017-06-30 23:24:41 +02:00
for ( auto & rtt : m_rtts . m_bound_render_targets )
{
2017-11-22 16:45:26 +01:00
if ( auto surface = std : : get < 1 > ( rtt ) )
2017-06-30 23:24:41 +02:00
{
2017-07-18 12:44:36 +02:00
if ( surface - > old_contents ! = nullptr )
2017-06-30 23:24:41 +02:00
copy_rtt_contents ( surface ) ;
}
}
}
2017-11-15 13:02:59 +01:00
else
{
// Old contents are one use only. Keep the depth conversion check from firing over and over
if ( ds ) ds - > old_contents = nullptr ;
}
2017-06-30 23:24:41 +02:00
2017-07-18 12:44:36 +02:00
glEnable ( GL_SCISSOR_TEST ) ;
2017-01-29 00:00:49 +01:00
std : : chrono : : time_point < steady_clock > draw_start = steady_clock : : now ( ) ;
2015-12-23 22:25:02 +01:00
2017-05-20 13:45:02 +02:00
if ( g_cfg . video . debug_output )
2016-06-20 23:38:38 +02:00
{
2016-06-11 21:51:34 +02:00
m_program - > validate ( ) ;
2016-06-20 23:38:38 +02:00
}
2016-02-02 19:41:39 +01:00
2017-09-07 21:32:52 +02:00
const GLenum draw_mode = gl : : draw_mode ( rsx : : method_registers . current_draw_clause . primitive ) ;
2017-10-17 12:34:44 +02:00
bool single_draw = ! supports_multidraw | | ( rsx : : method_registers . current_draw_clause . first_count_commands . size ( ) < = 1 | | rsx : : method_registers . current_draw_clause . is_disjoint_primitive ) ;
2017-09-07 21:32:52 +02:00
2018-01-21 16:31:35 +01:00
if ( upload_info . index_info )
2016-10-18 09:57:28 +02:00
{
2018-01-21 16:31:35 +01:00
const GLenum index_type = std : : get < 0 > ( upload_info . index_info . value ( ) ) ;
const u32 index_offset = std : : get < 1 > ( upload_info . index_info . value ( ) ) ;
2017-10-17 12:09:02 +02:00
const bool restarts_valid = gl : : is_primitive_native ( rsx : : method_registers . current_draw_clause . primitive ) & & ! rsx : : method_registers . current_draw_clause . is_disjoint_primitive ;
2016-10-18 09:57:28 +02:00
2017-10-17 12:09:02 +02:00
if ( gl_state . enable ( restarts_valid & & rsx : : method_registers . restart_index_enabled ( ) , GL_PRIMITIVE_RESTART ) )
2017-09-07 21:32:52 +02:00
{
glPrimitiveRestartIndex ( ( index_type = = GL_UNSIGNED_SHORT ) ? 0xffff : 0xffffffff ) ;
}
if ( single_draw )
2016-09-20 16:23:56 +02:00
{
2018-01-21 16:31:35 +01:00
glDrawElements ( draw_mode , upload_info . vertex_draw_count , index_type , ( GLvoid * ) ( uintptr_t ) index_offset ) ;
2016-09-20 16:23:56 +02:00
}
2017-09-07 21:32:52 +02:00
else
{
std : : vector < GLsizei > counts ;
std : : vector < const GLvoid * > offsets ;
const auto draw_count = rsx : : method_registers . current_draw_clause . first_count_commands . size ( ) ;
const u32 type_scale = ( index_type = = GL_UNSIGNED_SHORT ) ? 1 : 2 ;
uintptr_t index_ptr = index_offset ;
2016-09-20 16:23:56 +02:00
2017-09-07 21:32:52 +02:00
counts . reserve ( draw_count ) ;
offsets . reserve ( draw_count ) ;
for ( const auto & range : rsx : : method_registers . current_draw_clause . first_count_commands )
{
const auto index_size = get_index_count ( rsx : : method_registers . current_draw_clause . primitive , range . second ) ;
counts . push_back ( index_size ) ;
offsets . push_back ( ( const GLvoid * ) index_ptr ) ;
index_ptr + = ( index_size < < type_scale ) ;
}
2017-09-08 23:22:51 +02:00
glMultiDrawElements ( draw_mode , counts . data ( ) , index_type , offsets . data ( ) , ( GLsizei ) draw_count ) ;
2017-09-07 21:32:52 +02:00
}
2016-03-01 21:42:46 +01:00
}
2016-01-12 00:54:07 +01:00
else
{
2017-09-07 21:32:52 +02:00
if ( single_draw )
{
2018-01-21 16:31:35 +01:00
glDrawArrays ( draw_mode , 0 , upload_info . vertex_draw_count ) ;
2017-09-07 21:32:52 +02:00
}
else
{
2017-10-17 12:34:44 +02:00
u32 base_index = rsx : : method_registers . current_draw_clause . first_count_commands . front ( ) . first ;
if ( gl : : get_driver_caps ( ) . vendor_AMD = = false )
{
std : : vector < GLint > firsts ;
std : : vector < GLsizei > counts ;
const auto draw_count = rsx : : method_registers . current_draw_clause . first_count_commands . size ( ) ;
2017-09-07 21:32:52 +02:00
2017-10-17 12:34:44 +02:00
firsts . reserve ( draw_count ) ;
counts . reserve ( draw_count ) ;
2017-09-07 21:32:52 +02:00
2017-10-17 12:34:44 +02:00
for ( const auto & range : rsx : : method_registers . current_draw_clause . first_count_commands )
{
firsts . push_back ( range . first - base_index ) ;
counts . push_back ( range . second ) ;
}
glMultiDrawArrays ( draw_mode , firsts . data ( ) , counts . data ( ) , ( GLsizei ) draw_count ) ;
}
else
2017-09-07 21:32:52 +02:00
{
2017-10-17 12:34:44 +02:00
//MultiDrawArrays is broken on some primitive types using AMD. One known type is GL_TRIANGLE_STRIP but there could be more
for ( const auto & range : rsx : : method_registers . current_draw_clause . first_count_commands )
{
glDrawArrays ( draw_mode , range . first - base_index , range . second ) ;
}
2017-09-07 21:32:52 +02:00
}
}
2015-10-04 00:45:26 +02:00
}
2015-10-11 22:00:51 +02:00
2017-02-16 19:29:56 +01:00
m_attrib_ring_buffer - > notify ( ) ;
m_index_ring_buffer - > notify ( ) ;
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer - > notify ( ) ;
2017-03-11 10:07:26 +01:00
m_fragment_constants_buffer - > notify ( ) ;
m_transform_constants_buffer - > notify ( ) ;
2017-02-16 19:29:56 +01:00
2017-01-29 00:00:49 +01:00
std : : chrono : : time_point < steady_clock > draw_end = steady_clock : : now ( ) ;
2016-10-11 02:55:42 +02:00
m_draw_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( draw_end - draw_start ) . count ( ) ;
2017-02-16 19:29:56 +01:00
m_draw_calls + + ;
synchronize_buffers ( ) ;
2015-10-11 22:00:51 +02:00
rsx : : thread : : end ( ) ;
2015-10-09 20:04:20 +02:00
}
2014-08-18 16:37:23 +02:00
2016-01-06 00:15:35 +01:00
void GLGSRender : : set_viewport ( )
{
2016-09-26 14:21:17 +02:00
//NOTE: scale offset matrix already contains the viewport transformation
2017-09-26 15:24:43 +02:00
const auto clip_width = rsx : : apply_resolution_scale ( rsx : : method_registers . surface_clip_width ( ) , true ) ;
const auto clip_height = rsx : : apply_resolution_scale ( rsx : : method_registers . surface_clip_height ( ) , true ) ;
2017-07-05 00:16:59 +02:00
glViewport ( 0 , 0 , clip_width , clip_height ) ;
2016-01-06 00:15:35 +01:00
2017-09-26 15:24:43 +02:00
u16 scissor_x = rsx : : apply_resolution_scale ( rsx : : method_registers . scissor_origin_x ( ) , false ) ;
u16 scissor_w = rsx : : apply_resolution_scale ( rsx : : method_registers . scissor_width ( ) , true ) ;
u16 scissor_y = rsx : : apply_resolution_scale ( rsx : : method_registers . scissor_origin_y ( ) , false ) ;
u16 scissor_h = rsx : : apply_resolution_scale ( rsx : : method_registers . scissor_height ( ) , true ) ;
2016-01-06 00:15:35 +01:00
2017-07-05 00:16:59 +02:00
//Do not bother drawing anything if output is zero sized
//TODO: Clip scissor region
if ( scissor_x > = clip_width | | scissor_y > = clip_height | | scissor_w = = 0 | | scissor_h = = 0 )
{
if ( ! g_cfg . video . strict_rendering_mode )
{
framebuffer_status_valid = false ;
return ;
}
}
2016-09-26 14:21:17 +02:00
//NOTE: window origin does not affect scissor region (probably only affects viewport matrix; already applied)
//See LIMBO [NPUB-30373] which uses shader window origin = top
2017-09-07 21:32:52 +02:00
glScissor ( scissor_x , scissor_y , scissor_w , scissor_h ) ;
2016-01-06 00:15:35 +01:00
glEnable ( GL_SCISSOR_TEST ) ;
}
2015-11-26 09:06:29 +01:00
void GLGSRender : : on_init_thread ( )
2015-10-09 20:04:20 +02:00
{
2015-11-26 09:06:29 +01:00
GSRender : : on_init_thread ( ) ;
2015-10-11 22:00:51 +02:00
gl : : init ( ) ;
2017-04-04 18:14:36 +02:00
2017-08-13 19:41:55 +02:00
//Enable adaptive vsync if vsync is requested
gl : : set_swapinterval ( g_cfg . video . vsync ? - 1 : 0 ) ;
2017-05-20 13:45:02 +02:00
if ( g_cfg . video . debug_output )
2016-03-22 22:26:37 +01:00
gl : : enable_debugging ( ) ;
2017-04-04 18:14:36 +02:00
2016-01-12 22:57:16 +01:00
LOG_NOTICE ( RSX , " %s " , ( const char * ) glGetString ( GL_VERSION ) ) ;
LOG_NOTICE ( RSX , " %s " , ( const char * ) glGetString ( GL_SHADING_LANGUAGE_VERSION ) ) ;
LOG_NOTICE ( RSX , " %s " , ( const char * ) glGetString ( GL_VENDOR ) ) ;
2015-10-11 22:00:51 +02:00
2017-06-19 12:47:38 +02:00
auto & gl_caps = gl : : get_driver_caps ( ) ;
2017-04-04 18:14:36 +02:00
if ( ! gl_caps . ARB_texture_buffer_supported )
{
fmt : : throw_exception ( " Failed to initialize OpenGL renderer. ARB_texture_buffer_object is required but not supported by your GPU " ) ;
}
if ( ! gl_caps . ARB_dsa_supported & & ! gl_caps . EXT_dsa_supported )
{
fmt : : throw_exception ( " Failed to initialize OpenGL renderer. ARB_direct_state_access or EXT_direct_state_access is required but not supported by your GPU " ) ;
}
2017-06-19 12:47:38 +02:00
if ( ! gl_caps . ARB_depth_buffer_float_supported & & g_cfg . video . force_high_precision_z_buffer )
{
LOG_WARNING ( RSX , " High precision Z buffer requested but your GPU does not support GL_ARB_depth_buffer_float. Option ignored. " ) ;
}
2017-06-22 20:25:58 +02:00
if ( ! gl_caps . ARB_texture_barrier_supported & & ! gl_caps . NV_texture_barrier_supported & & ! g_cfg . video . strict_rendering_mode )
{
LOG_WARNING ( RSX , " Texture barriers are not supported by your GPU. Feedback loops will have undefined results. " ) ;
}
2017-04-04 18:14:36 +02:00
//Use industry standard resource alignment values as defaults
m_uniform_buffer_offset_align = 256 ;
m_min_texbuffer_alignment = 256 ;
2018-01-21 16:31:35 +01:00
m_max_texbuffer_size = 0 ;
2017-04-04 18:14:36 +02:00
2015-10-11 22:00:51 +02:00
glEnable ( GL_VERTEX_PROGRAM_POINT_SIZE ) ;
2016-06-20 23:38:38 +02:00
glGetIntegerv ( GL_UNIFORM_BUFFER_OFFSET_ALIGNMENT , & m_uniform_buffer_offset_align ) ;
2016-06-12 17:54:15 +02:00
glGetIntegerv ( GL_TEXTURE_BUFFER_OFFSET_ALIGNMENT , & m_min_texbuffer_alignment ) ;
2018-01-21 16:31:35 +01:00
glGetIntegerv ( GL_MAX_TEXTURE_BUFFER_SIZE , & m_max_texbuffer_size ) ;
2015-10-14 00:45:18 +02:00
m_vao . create ( ) ;
2016-01-28 18:01:10 +01:00
2017-03-29 11:29:11 +02:00
//Set min alignment to 16-bytes for SSE optimizations with aligned addresses to work
m_min_texbuffer_alignment = std : : max ( m_min_texbuffer_alignment , 16 ) ;
m_uniform_buffer_offset_align = std : : max ( m_uniform_buffer_offset_align , 16 ) ;
2018-01-21 16:31:35 +01:00
LOG_NOTICE ( RSX , " Supported texel buffer size reported: %d bytes " , m_max_texbuffer_size ) ;
if ( m_max_texbuffer_size < ( 16 * 0x100000 ) )
{
LOG_ERROR ( RSX , " Max texture buffer size supported is less than 16M which is useless. Expect undefined behaviour. " ) ;
m_max_texbuffer_size = ( 16 * 0x100000 ) ;
}
2017-04-04 18:14:36 +02:00
const u32 texture_index_offset = rsx : : limits : : fragment_textures_count + rsx : : limits : : vertex_textures_count ;
2017-07-31 13:38:28 +02:00
//Array stream buffer
2016-01-28 18:01:10 +01:00
{
2017-07-31 13:38:28 +02:00
auto & tex = m_gl_persistent_stream_buffer ;
2016-06-11 21:51:34 +02:00
tex . create ( ) ;
tex . set_target ( gl : : texture : : target : : textureBuffer ) ;
2017-07-31 13:38:28 +02:00
glActiveTexture ( GL_TEXTURE0 + texture_index_offset ) ;
tex . bind ( ) ;
}
2016-10-18 09:57:28 +02:00
2017-07-31 13:38:28 +02:00
//Register stream buffer
{
auto & tex = m_gl_volatile_stream_buffer ;
tex . create ( ) ;
tex . set_target ( gl : : texture : : target : : textureBuffer ) ;
glActiveTexture ( GL_TEXTURE0 + texture_index_offset + 1 ) ;
2016-10-18 09:57:28 +02:00
tex . bind ( ) ;
2016-01-28 18:01:10 +01:00
}
2016-02-15 10:50:14 +01:00
2018-02-02 13:25:15 +01:00
//Fallback null texture instead of relying on texture0
{
std : : vector < u32 > pixeldata = { 0 , 0 , 0 , 0 } ;
//1D
auto tex1D = std : : make_unique < gl : : texture > ( ) ;
tex1D - > create ( ) ;
tex1D - > set_target ( gl : : texture : : target : : texture1D ) ;
tex1D - > config ( ) . width ( 1 ) . min_lod ( 0.f ) . max_lod ( 0.f ) . pixels ( pixeldata . data ( ) ) . apply ( ) ;
//2D
auto tex2D = std : : make_unique < gl : : texture > ( ) ;
tex2D - > create ( ) ;
tex2D - > set_target ( gl : : texture : : target : : texture2D ) ;
tex2D - > config ( ) . width ( 1 ) . height ( 1 ) . min_lod ( 0.f ) . max_lod ( 0.f ) . pixels ( pixeldata . data ( ) ) . apply ( ) ;
//3D
auto tex3D = std : : make_unique < gl : : texture > ( ) ;
tex3D - > create ( ) ;
tex3D - > set_target ( gl : : texture : : target : : texture3D ) ;
tex3D - > config ( ) . width ( 1 ) . height ( 1 ) . depth ( 1 ) . min_lod ( 0.f ) . max_lod ( 0.f ) . pixels ( pixeldata . data ( ) ) . apply ( ) ;
//CUBE
auto texCUBE = std : : make_unique < gl : : texture > ( ) ;
texCUBE - > create ( ) ;
texCUBE - > set_target ( gl : : texture : : target : : textureCUBE ) ;
texCUBE - > config ( ) . width ( 1 ) . height ( 1 ) . depth ( 1 ) . min_lod ( 0.f ) . max_lod ( 0.f ) . pixels ( pixeldata . data ( ) ) . apply ( ) ;
m_null_textures [ GL_TEXTURE_1D ] = std : : move ( tex1D ) ;
m_null_textures [ GL_TEXTURE_2D ] = std : : move ( tex2D ) ;
m_null_textures [ GL_TEXTURE_3D ] = std : : move ( tex3D ) ;
m_null_textures [ GL_TEXTURE_CUBE_MAP ] = std : : move ( texCUBE ) ;
}
2017-04-04 18:14:36 +02:00
if ( ! gl_caps . ARB_buffer_storage_supported )
{
LOG_WARNING ( RSX , " Forcing use of legacy OpenGL buffers because ARB_buffer_storage is not supported " ) ;
2017-05-20 13:45:02 +02:00
// TODO: do not modify config options
g_cfg . video . gl_legacy_buffers . from_string ( " true " ) ;
2017-04-04 18:14:36 +02:00
}
2017-05-20 13:45:02 +02:00
if ( g_cfg . video . gl_legacy_buffers )
2016-10-18 09:57:28 +02:00
{
LOG_WARNING ( RSX , " Using legacy openGL buffers. " ) ;
manually_flush_ring_buffers = true ;
2016-06-12 11:05:22 +02:00
2016-10-18 09:57:28 +02:00
m_attrib_ring_buffer . reset ( new gl : : legacy_ring_buffer ( ) ) ;
2017-03-11 10:07:26 +01:00
m_transform_constants_buffer . reset ( new gl : : legacy_ring_buffer ( ) ) ;
m_fragment_constants_buffer . reset ( new gl : : legacy_ring_buffer ( ) ) ;
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer . reset ( new gl : : legacy_ring_buffer ( ) ) ;
2016-10-18 09:57:28 +02:00
m_index_ring_buffer . reset ( new gl : : legacy_ring_buffer ( ) ) ;
}
else
{
m_attrib_ring_buffer . reset ( new gl : : ring_buffer ( ) ) ;
2017-03-11 10:07:26 +01:00
m_transform_constants_buffer . reset ( new gl : : ring_buffer ( ) ) ;
m_fragment_constants_buffer . reset ( new gl : : ring_buffer ( ) ) ;
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer . reset ( new gl : : ring_buffer ( ) ) ;
2016-10-18 09:57:28 +02:00
m_index_ring_buffer . reset ( new gl : : ring_buffer ( ) ) ;
}
2018-01-21 16:31:35 +01:00
m_attrib_ring_buffer - > create ( gl : : buffer : : target : : texture , std : : min < GLsizeiptr > ( m_max_texbuffer_size , 256 * 0x100000 ) ) ;
m_index_ring_buffer - > create ( gl : : buffer : : target : : element_array , std : : min < GLsizeiptr > ( m_max_texbuffer_size , 64 * 0x100000 ) ) ;
m_transform_constants_buffer - > create ( gl : : buffer : : target : : uniform , std : : min < GLsizeiptr > ( m_max_texbuffer_size , 16 * 0x100000 ) ) ;
m_fragment_constants_buffer - > create ( gl : : buffer : : target : : uniform , std : : min < GLsizeiptr > ( m_max_texbuffer_size , 16 * 0x100000 ) ) ;
m_vertex_state_buffer - > create ( gl : : buffer : : target : : uniform , std : : min < GLsizeiptr > ( m_max_texbuffer_size , 16 * 0x100000 ) ) ;
m_gl_persistent_stream_buffer . copy_from ( * m_attrib_ring_buffer , GL_R8UI , 0 , ( u32 ) m_attrib_ring_buffer - > size ( ) ) ;
m_gl_volatile_stream_buffer . copy_from ( * m_attrib_ring_buffer , GL_R8UI , 0 , ( u32 ) m_attrib_ring_buffer - > size ( ) ) ;
2016-10-18 09:57:28 +02:00
m_vao . element_array_buffer = * m_index_ring_buffer ;
2016-10-20 05:20:45 +02:00
2017-05-20 13:45:02 +02:00
if ( g_cfg . video . overlay )
2017-04-04 18:14:36 +02:00
{
if ( gl_caps . ARB_shader_draw_parameters_supported )
{
m_text_printer . init ( ) ;
m_text_printer . set_enabled ( true ) ;
}
}
2017-02-16 19:29:56 +01:00
2017-03-29 21:27:29 +02:00
for ( int i = 0 ; i < rsx : : limits : : fragment_textures_count ; + + i )
{
m_gl_sampler_states [ i ] . create ( ) ;
m_gl_sampler_states [ i ] . bind ( i ) ;
}
2017-07-27 18:04:55 +02:00
//Occlusion query
for ( u32 i = 0 ; i < occlusion_query_count ; + + i )
{
2017-11-16 22:52:21 +01:00
GLuint handle = 0 ;
2017-07-27 18:04:55 +02:00
auto & query = occlusion_query_data [ i ] ;
2017-11-16 22:52:21 +01:00
glGenQueries ( 1 , & handle ) ;
2017-07-27 18:04:55 +02:00
2017-11-16 22:52:21 +01:00
query . driver_handle = ( u64 ) handle ;
2017-07-27 18:04:55 +02:00
query . pending = false ;
query . active = false ;
query . result = 0 ;
}
2017-05-11 00:42:55 +02:00
//Clip planes are shader controlled; enable all planes driver-side
glEnable ( GL_CLIP_DISTANCE0 + 0 ) ;
glEnable ( GL_CLIP_DISTANCE0 + 1 ) ;
glEnable ( GL_CLIP_DISTANCE0 + 2 ) ;
glEnable ( GL_CLIP_DISTANCE0 + 3 ) ;
glEnable ( GL_CLIP_DISTANCE0 + 4 ) ;
glEnable ( GL_CLIP_DISTANCE0 + 5 ) ;
2017-11-15 13:02:59 +01:00
m_depth_converter . create ( ) ;
2018-01-17 17:14:00 +01:00
m_ui_renderer . create ( ) ;
2017-11-15 13:02:59 +01:00
2017-09-08 16:52:13 +02:00
m_gl_texture_cache . initialize ( ) ;
m_thread_id = std : : this_thread : : get_id ( ) ;
2017-08-10 21:40:20 +02:00
2018-01-17 17:14:00 +01:00
if ( ! supports_native_ui )
{
m_frame - > disable_wm_event_queue ( ) ;
m_frame - > hide ( ) ;
m_shaders_cache - > load ( nullptr ) ;
m_frame - > enable_wm_event_queue ( ) ;
m_frame - > show ( ) ;
}
else
{
struct native_helper : gl : : shader_cache : : progress_dialog_helper
{
rsx : : thread * owner = nullptr ;
rsx : : overlays : : message_dialog * dlg = nullptr ;
native_helper ( GLGSRender * ptr ) :
owner ( ptr ) { }
void create ( ) override
{
MsgDialogType type = { } ;
type . disable_cancel = true ;
type . progress_bar_count = 1 ;
dlg = owner - > shell_open_message_dialog ( ) ;
dlg - > show ( " Loading precompiled shaders from disk... " , type , [ ] ( s32 status )
{
if ( status ! = CELL_OK )
Emu . Stop ( ) ;
} ) ;
}
void update_msg ( u32 processed , u32 entry_count ) override
{
dlg - > progress_bar_set_message ( 0 , fmt : : format ( " Loading pipeline object %u of %u " , processed , entry_count ) ) ;
owner - > flip ( 0 ) ;
}
void inc_value ( u32 value ) override
{
dlg - > progress_bar_increment ( 0 , ( f32 ) value ) ;
owner - > flip ( 0 ) ;
}
void close ( ) override
{
dlg - > return_code = CELL_OK ;
dlg - > close ( ) ;
}
}
helper ( this ) ;
2017-10-28 14:34:24 +02:00
2018-01-17 17:14:00 +01:00
m_frame - > enable_wm_event_queue ( ) ;
m_shaders_cache - > load ( & helper ) ;
}
2015-10-09 20:04:20 +02:00
}
2018-01-17 17:14:00 +01:00
2015-11-26 09:06:29 +01:00
void GLGSRender : : on_exit ( )
2015-10-09 20:04:20 +02:00
{
2016-08-26 16:23:23 +02:00
m_prog_buffer . clear ( ) ;
2015-10-04 00:45:26 +02:00
2015-10-11 22:00:51 +02:00
if ( draw_fbo )
2016-06-26 14:47:48 +02:00
{
2015-10-11 22:00:51 +02:00
draw_fbo . remove ( ) ;
2016-06-26 14:47:48 +02:00
}
2015-10-04 00:45:26 +02:00
2015-10-11 22:00:51 +02:00
if ( m_flip_fbo )
2016-06-26 14:47:48 +02:00
{
2015-10-11 22:00:51 +02:00
m_flip_fbo . remove ( ) ;
2016-06-26 14:47:48 +02:00
}
2015-10-04 00:45:26 +02:00
2015-10-11 22:00:51 +02:00
if ( m_flip_tex_color )
2016-06-26 14:47:48 +02:00
{
2015-10-11 22:00:51 +02:00
m_flip_tex_color . remove ( ) ;
2016-06-26 14:47:48 +02:00
}
2015-10-14 00:45:18 +02:00
if ( m_vao )
2016-06-26 14:47:48 +02:00
{
2015-10-14 00:45:18 +02:00
m_vao . remove ( ) ;
2016-06-26 14:47:48 +02:00
}
2015-10-14 02:15:23 +02:00
2017-07-31 13:38:28 +02:00
m_gl_persistent_stream_buffer . remove ( ) ;
m_gl_volatile_stream_buffer . remove ( ) ;
2016-06-11 21:51:34 +02:00
2017-03-29 21:27:29 +02:00
for ( auto & sampler : m_gl_sampler_states )
{
sampler . remove ( ) ;
}
2018-02-02 13:25:15 +01:00
for ( auto & tex : m_null_textures )
{
tex . second - > remove ( ) ;
}
2017-04-17 23:30:34 +02:00
if ( m_attrib_ring_buffer )
{
m_attrib_ring_buffer - > remove ( ) ;
}
if ( m_transform_constants_buffer )
{
m_transform_constants_buffer - > remove ( ) ;
}
if ( m_fragment_constants_buffer )
{
m_fragment_constants_buffer - > remove ( ) ;
}
2017-07-31 13:38:28 +02:00
if ( m_vertex_state_buffer )
2017-04-17 23:30:34 +02:00
{
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer - > remove ( ) ;
2017-04-17 23:30:34 +02:00
}
if ( m_index_ring_buffer )
{
m_index_ring_buffer - > remove ( ) ;
}
2016-07-20 14:16:19 +02:00
2016-10-11 02:55:42 +02:00
m_text_printer . close ( ) ;
2017-09-08 16:52:13 +02:00
m_gl_texture_cache . destroy ( ) ;
2017-11-15 13:02:59 +01:00
m_depth_converter . destroy ( ) ;
2018-01-17 17:14:00 +01:00
m_ui_renderer . destroy ( ) ;
2016-10-11 02:55:42 +02:00
2017-07-27 18:04:55 +02:00
for ( u32 i = 0 ; i < occlusion_query_count ; + + i )
{
auto & query = occlusion_query_data [ i ] ;
query . active = false ;
query . pending = false ;
2017-11-16 22:52:21 +01:00
GLuint handle = ( GLuint ) query . driver_handle ;
glDeleteQueries ( 1 , & handle ) ;
query . driver_handle = 0 ;
2017-07-27 18:04:55 +02:00
}
2017-11-04 15:30:14 +01:00
glFlush ( ) ;
glFinish ( ) ;
2017-11-03 18:43:11 +01:00
GSRender : : on_exit ( ) ;
2012-11-15 00:39:56 +01:00
}
2017-02-16 19:29:56 +01:00
void GLGSRender : : clear_surface ( u32 arg )
2013-11-09 22:29:49 +01:00
{
2017-07-05 00:16:59 +02:00
if ( skip_frame | | ! framebuffer_status_valid ) return ;
2017-06-30 00:20:23 +02:00
if ( ( arg & 0xf3 ) = = 0 ) return ;
2014-08-18 16:37:23 +02:00
2015-10-11 22:00:51 +02:00
GLbitfield mask = 0 ;
2016-06-26 23:37:02 +02:00
rsx : : surface_depth_format surface_depth_format = rsx : : method_registers . surface_depth_fmt ( ) ;
2016-06-20 23:38:38 +02:00
2015-10-11 22:00:51 +02:00
if ( arg & 0x1 )
2015-10-09 20:04:20 +02:00
{
2016-01-13 17:40:10 +01:00
u32 max_depth_value = get_max_depth_value ( surface_depth_format ) ;
2017-03-26 13:51:25 +02:00
u32 clear_depth = rsx : : method_registers . z_clear_value ( surface_depth_format = = rsx : : surface_depth_format : : z24s8 ) ;
2014-02-16 09:56:58 +01:00
2017-07-27 18:04:55 +02:00
gl_state . depth_mask ( GL_TRUE ) ;
gl_state . clear_depth ( f32 ( clear_depth ) / max_depth_value ) ;
2015-10-11 22:00:51 +02:00
mask | = GLenum ( gl : : buffers : : depth ) ;
2017-02-16 19:29:56 +01:00
gl : : render_target * ds = std : : get < 1 > ( m_rtts . m_bound_depth_stencil ) ;
if ( ds & & ! ds - > cleared ( ) )
2017-06-30 23:24:41 +02:00
{
2017-02-16 19:29:56 +01:00
ds - > set_cleared ( ) ;
2017-06-30 23:24:41 +02:00
ds - > old_contents = nullptr ;
}
2015-10-11 22:00:51 +02:00
}
2014-02-16 09:56:58 +01:00
2016-06-26 14:47:48 +02:00
if ( surface_depth_format = = rsx : : surface_depth_format : : z24s8 & & ( arg & 0x2 ) )
2015-10-09 20:04:20 +02:00
{
2016-06-26 23:37:02 +02:00
u8 clear_stencil = rsx : : method_registers . stencil_clear_value ( ) ;
2014-02-16 09:56:58 +01:00
2017-07-27 18:04:55 +02:00
gl_state . stencil_mask ( rsx : : method_registers . stencil_mask ( ) ) ;
gl_state . clear_stencil ( clear_stencil ) ;
2015-10-04 00:45:26 +02:00
2015-10-11 22:00:51 +02:00
mask | = GLenum ( gl : : buffers : : stencil ) ;
}
if ( arg & 0xf0 )
{
2016-06-26 23:37:02 +02:00
u8 clear_a = rsx : : method_registers . clear_color_a ( ) ;
u8 clear_r = rsx : : method_registers . clear_color_r ( ) ;
u8 clear_g = rsx : : method_registers . clear_color_g ( ) ;
u8 clear_b = rsx : : method_registers . clear_color_b ( ) ;
2015-10-04 00:45:26 +02:00
2017-07-27 18:04:55 +02:00
gl_state . color_mask ( arg & 0xf0 ) ;
gl_state . clear_color ( clear_r , clear_g , clear_b , clear_a ) ;
2015-10-04 00:45:26 +02:00
2015-10-11 22:00:51 +02:00
mask | = GLenum ( gl : : buffers : : color ) ;
2017-06-30 23:24:41 +02:00
for ( auto & rtt : m_rtts . m_bound_render_targets )
{
if ( std : : get < 0 > ( rtt ) ! = 0 )
{
std : : get < 1 > ( rtt ) - > set_cleared ( true ) ;
std : : get < 1 > ( rtt ) - > old_contents = nullptr ;
}
}
2015-10-11 22:00:51 +02:00
}
2015-10-04 00:45:26 +02:00
2016-01-06 00:15:35 +01:00
glClear ( mask ) ;
2013-11-09 22:29:49 +01:00
}
2013-08-26 16:18:59 +02:00
2015-11-26 09:06:29 +01:00
bool GLGSRender : : do_method ( u32 cmd , u32 arg )
2015-10-11 22:00:51 +02:00
{
2016-07-22 01:31:58 +02:00
switch ( cmd )
{
case NV4097_CLEAR_SURFACE :
2017-02-27 13:50:00 +01:00
{
2017-07-23 16:11:45 +02:00
if ( arg & 0xF3 )
{
//Only do all this if we have actual work to do
2017-11-15 16:50:41 +01:00
u8 ctx = rsx : : framebuffer_creation_context : : context_draw ;
if ( arg & 0xF0 ) ctx | = rsx : : framebuffer_creation_context : : context_clear_color ;
if ( arg & 0x3 ) ctx | = rsx : : framebuffer_creation_context : : context_clear_depth ;
init_buffers ( ( rsx : : framebuffer_creation_context ) ctx , true ) ;
2017-07-23 16:11:45 +02:00
synchronize_buffers ( ) ;
clear_surface ( arg ) ;
}
2017-02-16 19:29:56 +01:00
return true ;
2017-02-27 13:50:00 +01:00
}
2017-08-18 20:10:21 +02:00
case NV4097_CLEAR_ZCULL_SURFACE :
{
2017-08-26 17:17:46 +02:00
// NOP
// Clearing zcull memory does not modify depth/stencil buffers 'bound' to the zcull region
2017-08-18 20:10:21 +02:00
return true ;
}
2017-02-16 19:29:56 +01:00
case NV4097_TEXTURE_READ_SEMAPHORE_RELEASE :
case NV4097_BACK_END_WRITE_SEMAPHORE_RELEASE :
flush_draw_buffers = true ;
return true ;
2016-07-22 01:31:58 +02:00
}
2017-02-16 19:29:56 +01:00
return false ;
2015-10-09 20:04:20 +02:00
}
2015-10-04 00:45:26 +02:00
2017-07-31 13:38:28 +02:00
bool GLGSRender : : check_program_state ( )
2015-10-09 20:04:20 +02:00
{
2017-10-30 13:27:22 +01:00
return ( rsx : : method_registers . shader_program_address ( ) ! = 0 ) ;
2017-07-31 13:38:28 +02:00
}
2017-02-10 10:08:46 +01:00
2018-01-21 16:31:35 +01:00
void GLGSRender : : load_program ( const vertex_upload_info & upload_info )
2017-07-31 13:38:28 +02:00
{
2017-10-30 13:27:22 +01:00
get_current_fragment_program ( fs_sampler_state ) ;
verify ( HERE ) , current_fragment_program . valid ;
get_current_vertex_program ( ) ;
2017-07-31 13:38:28 +02:00
auto & fragment_program = current_fragment_program ;
auto & vertex_program = current_vertex_program ;
2015-10-04 00:45:26 +02:00
2017-07-31 13:38:28 +02:00
vertex_program . skip_vertex_input_check = true ; //not needed for us since decoding is done server side
2017-11-02 19:54:19 +01:00
fragment_program . unnormalized_coords = 0 ; //unused
2017-08-10 21:40:20 +02:00
void * pipeline_properties = nullptr ;
2017-11-02 16:54:57 +01:00
m_program = & m_prog_buffer . getGraphicPipelineState ( vertex_program , fragment_program , pipeline_properties ) ;
m_program - > use ( ) ;
if ( m_prog_buffer . check_cache_missed ( ) )
2018-01-17 17:14:00 +01:00
{
2017-11-02 16:54:57 +01:00
m_shaders_cache - > store ( pipeline_properties , vertex_program , fragment_program ) ;
2018-01-17 17:14:00 +01:00
//Notify the user with HUD notification
if ( ! m_custom_ui )
{
//Create notification but do not draw it at this time. No need to spam flip requests
m_custom_ui = std : : make_unique < rsx : : overlays : : shader_compile_notification > ( ) ;
}
else if ( auto casted = dynamic_cast < rsx : : overlays : : shader_compile_notification * > ( m_custom_ui . get ( ) ) )
{
//Probe the notification
casted - > touch ( ) ;
}
}
2016-08-27 08:12:44 +02:00
u8 * buf ;
2017-07-31 13:38:28 +02:00
u32 vertex_state_offset ;
2016-06-12 11:05:22 +02:00
u32 vertex_constants_offset ;
u32 fragment_constants_offset ;
2016-02-13 11:26:07 +01:00
2017-06-18 16:53:02 +02:00
const u32 fragment_constants_size = ( const u32 ) m_prog_buffer . get_fragment_constants_buffer_size ( fragment_program ) ;
2017-08-21 19:56:31 +02:00
const u32 fragment_buffer_size = fragment_constants_size + ( 18 * 4 * sizeof ( float ) ) ;
2017-03-11 10:07:26 +01:00
if ( manually_flush_ring_buffers )
{
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer - > reserve_storage_on_heap ( 512 ) ;
2017-03-11 10:07:26 +01:00
m_fragment_constants_buffer - > reserve_storage_on_heap ( align ( fragment_buffer_size , 256 ) ) ;
if ( m_transform_constants_dirty ) m_transform_constants_buffer - > reserve_storage_on_heap ( 8192 ) ;
}
2017-07-31 13:38:28 +02:00
// Vertex state
auto mapping = m_vertex_state_buffer - > alloc_from_heap ( 512 , m_uniform_buffer_offset_align ) ;
2016-08-27 08:12:44 +02:00
buf = static_cast < u8 * > ( mapping . first ) ;
2017-07-31 13:38:28 +02:00
vertex_state_offset = mapping . second ;
2017-06-14 17:47:01 +02:00
fill_scale_offset_data ( buf , false ) ;
2017-07-31 13:38:28 +02:00
fill_user_clip_data ( buf + 64 ) ;
* ( reinterpret_cast < u32 * > ( buf + 128 ) ) = rsx : : method_registers . transform_branch_bits ( ) ;
2018-01-21 16:31:35 +01:00
* ( reinterpret_cast < u32 * > ( buf + 132 ) ) = upload_info . vertex_index_base ;
2017-12-09 21:08:36 +01:00
* ( reinterpret_cast < f32 * > ( buf + 136 ) ) = rsx : : method_registers . point_size ( ) ;
2018-01-18 13:06:28 +01:00
* ( reinterpret_cast < f32 * > ( buf + 140 ) ) = rsx : : method_registers . clip_min ( ) ;
* ( reinterpret_cast < f32 * > ( buf + 144 ) ) = rsx : : method_registers . clip_max ( ) ;
2018-01-21 16:31:35 +01:00
fill_vertex_layout_state ( m_vertex_layout , upload_info . allocated_vertex_count , reinterpret_cast < s32 * > ( buf + 160 ) , upload_info . persistent_mapping_offset , upload_info . volatile_mapping_offset ) ;
2016-08-27 08:12:44 +02:00
2017-03-11 10:07:26 +01:00
if ( m_transform_constants_dirty )
{
// Vertex constants
mapping = m_transform_constants_buffer - > alloc_from_heap ( 8192 , m_uniform_buffer_offset_align ) ;
buf = static_cast < u8 * > ( mapping . first ) ;
vertex_constants_offset = mapping . second ;
fill_vertex_program_constants_data ( buf ) ;
}
2016-08-26 16:23:23 +02:00
// Fragment constants
2017-03-11 10:07:26 +01:00
mapping = m_fragment_constants_buffer - > alloc_from_heap ( fragment_buffer_size , m_uniform_buffer_offset_align ) ;
2017-02-10 10:08:46 +01:00
buf = static_cast < u8 * > ( mapping . first ) ;
fragment_constants_offset = mapping . second ;
2016-06-20 23:38:38 +02:00
if ( fragment_constants_size )
2016-08-27 08:12:44 +02:00
m_prog_buffer . fill_fragment_constants_buffer ( { reinterpret_cast < float * > ( buf ) , gsl : : narrow < int > ( fragment_constants_size ) } , fragment_program ) ;
2017-04-04 18:14:36 +02:00
2017-02-10 10:08:46 +01:00
// Fragment state
fill_fragment_state_buffer ( buf + fragment_constants_size , fragment_program ) ;
2016-06-12 11:05:22 +02:00
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer - > bind_range ( 0 , vertex_state_offset , 512 ) ;
2017-03-11 10:07:26 +01:00
m_fragment_constants_buffer - > bind_range ( 2 , fragment_constants_offset , fragment_buffer_size ) ;
if ( m_transform_constants_dirty ) m_transform_constants_buffer - > bind_range ( 1 , vertex_constants_offset , 8192 ) ;
2016-06-27 00:52:08 +02:00
2016-10-18 09:57:28 +02:00
if ( manually_flush_ring_buffers )
2017-03-11 10:07:26 +01:00
{
2017-07-31 13:38:28 +02:00
m_vertex_state_buffer - > unmap ( ) ;
2017-03-11 10:07:26 +01:00
m_fragment_constants_buffer - > unmap ( ) ;
2017-04-04 18:14:36 +02:00
2017-03-11 10:07:26 +01:00
if ( m_transform_constants_dirty ) m_transform_constants_buffer - > unmap ( ) ;
}
2016-10-18 09:57:28 +02:00
2017-03-11 10:07:26 +01:00
m_transform_constants_dirty = false ;
2017-11-01 14:38:37 +01:00
}
void GLGSRender : : update_draw_state ( )
{
std : : chrono : : time_point < steady_clock > then = steady_clock : : now ( ) ;
bool color_mask_b = rsx : : method_registers . color_mask_b ( ) ;
bool color_mask_g = rsx : : method_registers . color_mask_g ( ) ;
bool color_mask_r = rsx : : method_registers . color_mask_r ( ) ;
bool color_mask_a = rsx : : method_registers . color_mask_a ( ) ;
gl_state . color_mask ( color_mask_r , color_mask_g , color_mask_b , color_mask_a ) ;
gl_state . depth_mask ( rsx : : method_registers . depth_write_enabled ( ) ) ;
gl_state . stencil_mask ( rsx : : method_registers . stencil_mask ( ) ) ;
2018-01-18 13:06:28 +01:00
gl_state . enable ( rsx : : method_registers . depth_clamp_enabled ( ) | | ! rsx : : method_registers . depth_clip_enabled ( ) , GL_DEPTH_CLAMP ) ;
2017-12-29 17:57:58 +01:00
2017-11-01 14:38:37 +01:00
if ( gl_state . enable ( rsx : : method_registers . depth_test_enabled ( ) , GL_DEPTH_TEST ) )
{
gl_state . depth_func ( comparison_op ( rsx : : method_registers . depth_func ( ) ) ) ;
}
if ( glDepthBoundsEXT & & ( gl_state . enable ( rsx : : method_registers . depth_bounds_test_enabled ( ) , GL_DEPTH_BOUNDS_TEST_EXT ) ) )
{
gl_state . depth_bounds ( rsx : : method_registers . depth_bounds_min ( ) , rsx : : method_registers . depth_bounds_max ( ) ) ;
}
gl_state . enable ( rsx : : method_registers . dither_enabled ( ) , GL_DITHER ) ;
if ( gl_state . enable ( rsx : : method_registers . blend_enabled ( ) , GL_BLEND ) )
{
glBlendFuncSeparate ( blend_factor ( rsx : : method_registers . blend_func_sfactor_rgb ( ) ) ,
blend_factor ( rsx : : method_registers . blend_func_dfactor_rgb ( ) ) ,
blend_factor ( rsx : : method_registers . blend_func_sfactor_a ( ) ) ,
blend_factor ( rsx : : method_registers . blend_func_dfactor_a ( ) ) ) ;
auto blend_colors = rsx : : get_constant_blend_colors ( ) ;
glBlendColor ( blend_colors [ 0 ] , blend_colors [ 1 ] , blend_colors [ 2 ] , blend_colors [ 3 ] ) ;
glBlendEquationSeparate ( blend_equation ( rsx : : method_registers . blend_equation_rgb ( ) ) ,
blend_equation ( rsx : : method_registers . blend_equation_a ( ) ) ) ;
}
if ( gl_state . enable ( rsx : : method_registers . stencil_test_enabled ( ) , GL_STENCIL_TEST ) )
{
glStencilFunc ( comparison_op ( rsx : : method_registers . stencil_func ( ) ) ,
rsx : : method_registers . stencil_func_ref ( ) ,
rsx : : method_registers . stencil_func_mask ( ) ) ;
glStencilOp ( stencil_op ( rsx : : method_registers . stencil_op_fail ( ) ) , stencil_op ( rsx : : method_registers . stencil_op_zfail ( ) ) ,
stencil_op ( rsx : : method_registers . stencil_op_zpass ( ) ) ) ;
if ( rsx : : method_registers . two_sided_stencil_test_enabled ( ) )
{
glStencilMaskSeparate ( GL_BACK , rsx : : method_registers . back_stencil_mask ( ) ) ;
glStencilFuncSeparate ( GL_BACK , comparison_op ( rsx : : method_registers . back_stencil_func ( ) ) ,
rsx : : method_registers . back_stencil_func_ref ( ) , rsx : : method_registers . back_stencil_func_mask ( ) ) ;
glStencilOpSeparate ( GL_BACK , stencil_op ( rsx : : method_registers . back_stencil_op_fail ( ) ) ,
stencil_op ( rsx : : method_registers . back_stencil_op_zfail ( ) ) , stencil_op ( rsx : : method_registers . back_stencil_op_zpass ( ) ) ) ;
}
}
gl_state . enablei ( rsx : : method_registers . blend_enabled_surface_1 ( ) , GL_BLEND , 1 ) ;
gl_state . enablei ( rsx : : method_registers . blend_enabled_surface_2 ( ) , GL_BLEND , 2 ) ;
gl_state . enablei ( rsx : : method_registers . blend_enabled_surface_3 ( ) , GL_BLEND , 3 ) ;
if ( gl_state . enable ( rsx : : method_registers . logic_op_enabled ( ) , GL_COLOR_LOGIC_OP ) )
{
gl_state . logic_op ( logic_op ( rsx : : method_registers . logic_operation ( ) ) ) ;
}
gl_state . line_width ( rsx : : method_registers . line_width ( ) ) ;
gl_state . enable ( rsx : : method_registers . line_smooth_enabled ( ) , GL_LINE_SMOOTH ) ;
gl_state . enable ( rsx : : method_registers . poly_offset_point_enabled ( ) , GL_POLYGON_OFFSET_POINT ) ;
gl_state . enable ( rsx : : method_registers . poly_offset_line_enabled ( ) , GL_POLYGON_OFFSET_LINE ) ;
gl_state . enable ( rsx : : method_registers . poly_offset_fill_enabled ( ) , GL_POLYGON_OFFSET_FILL ) ;
//offset_bias is the constant factor, multiplied by the implementation factor R
//offst_scale is the slope factor, multiplied by the triangle slope factor M
gl_state . polygon_offset ( rsx : : method_registers . poly_offset_scale ( ) , rsx : : method_registers . poly_offset_bias ( ) ) ;
if ( gl_state . enable ( rsx : : method_registers . cull_face_enabled ( ) , GL_CULL_FACE ) )
{
gl_state . cull_face ( cull_face ( rsx : : method_registers . cull_face_mode ( ) ) ) ;
}
gl_state . front_face ( front_face ( rsx : : method_registers . front_face_mode ( ) ) ) ;
//TODO
//NV4097_SET_ANISO_SPREAD
//NV4097_SET_SPECULAR_ENABLE
//NV4097_SET_TWO_SIDE_LIGHT_EN
//NV4097_SET_FLAT_SHADE_OP
//NV4097_SET_EDGE_FLAG
//NV4097_SET_COLOR_KEY_COLOR
//NV4097_SET_SHADER_CONTROL
//NV4097_SET_ZMIN_MAX_CONTROL
//NV4097_SET_ANTI_ALIASING_CONTROL
//NV4097_SET_CLIP_ID_TEST_ENABLE
std : : chrono : : time_point < steady_clock > now = steady_clock : : now ( ) ;
m_begin_time + = ( u32 ) std : : chrono : : duration_cast < std : : chrono : : microseconds > ( now - then ) . count ( ) ;
2017-10-31 14:54:55 +01:00
}
2013-11-03 20:23:16 +01:00
2015-10-11 22:00:51 +02:00
void GLGSRender : : flip ( int buffer )
{
2017-06-30 00:20:23 +02:00
if ( skip_frame )
{
m_frame - > flip ( m_context , true ) ;
rsx : : thread : : flip ( buffer ) ;
if ( ! skip_frame )
{
m_draw_calls = 0 ;
m_begin_time = 0 ;
m_draw_time = 0 ;
m_vertex_upload_time = 0 ;
m_textures_upload_time = 0 ;
}
return ;
}
2018-01-21 16:31:35 +01:00
gl : : screen . clear ( gl : : buffers : : color ) ;
2017-07-26 04:33:32 +02:00
u32 buffer_width = display_buffers [ buffer ] . width ;
u32 buffer_height = display_buffers [ buffer ] . height ;
u32 buffer_pitch = display_buffers [ buffer ] . pitch ;
2016-01-05 21:55:43 +01:00
2018-01-21 21:55:01 +01:00
if ( ( u32 ) buffer < display_buffers_count & & buffer_width & & buffer_height & & buffer_pitch )
2017-07-26 20:18:04 +02:00
{
2018-01-21 16:31:35 +01:00
// Calculate blit coordinates
coordi aspect_ratio ;
sizei csize ( m_frame - > client_width ( ) , m_frame - > client_height ( ) ) ;
sizei new_size = csize ;
2017-07-26 20:18:04 +02:00
2018-01-21 16:31:35 +01:00
if ( ! g_cfg . video . stretch_to_display_area )
2017-07-26 20:18:04 +02:00
{
2018-01-21 16:31:35 +01:00
const double aq = ( double ) buffer_width / buffer_height ;
const double rq = ( double ) new_size . width / new_size . height ;
const double q = aq / rq ;
2017-07-26 20:18:04 +02:00
2018-01-21 16:31:35 +01:00
if ( q > 1.0 )
{
new_size . height = int ( new_size . height / q ) ;
aspect_ratio . y = ( csize . height - new_size . height ) / 2 ;
}
else if ( q < 1.0 )
{
new_size . width = int ( new_size . width * q ) ;
aspect_ratio . x = ( csize . width - new_size . width ) / 2 ;
}
}
2015-10-11 22:00:51 +02:00
2018-01-21 16:31:35 +01:00
aspect_ratio . size = new_size ;
2015-10-09 20:04:20 +02:00
2018-01-21 16:31:35 +01:00
// Find the source image
rsx : : tiled_region buffer_region = get_tiled_address ( display_buffers [ buffer ] . offset , CELL_GCM_LOCATION_LOCAL ) ;
u32 absolute_address = buffer_region . address + buffer_region . base ;
2017-07-26 20:18:04 +02:00
2018-01-21 16:31:35 +01:00
m_flip_fbo . recreate ( ) ;
m_flip_fbo . bind ( ) ;
2017-06-30 23:24:41 +02:00
2018-01-21 16:31:35 +01:00
const u32 size = buffer_pitch * buffer_height ;
if ( auto render_target_texture = m_rtts . get_texture_from_render_target_if_applicable ( absolute_address ) )
2015-10-09 20:04:20 +02:00
{
2018-01-21 16:31:35 +01:00
buffer_width = render_target_texture - > width ( ) ;
buffer_height = render_target_texture - > height ( ) ;
2015-10-09 20:04:20 +02:00
2018-01-21 16:31:35 +01:00
m_flip_fbo . color = * render_target_texture ;
m_flip_fbo . read_buffer ( m_flip_fbo . color ) ;
2013-11-09 22:29:49 +01:00
}
2018-01-21 16:31:35 +01:00
else if ( auto surface = m_gl_texture_cache . find_texture_from_dimensions ( absolute_address ) )
2016-01-05 21:55:43 +01:00
{
2018-01-21 16:31:35 +01:00
//Hack - this should be the first location to check for output
//The render might have been done offscreen or in software and a blit used to display
m_flip_fbo . color = surface - > get_raw_view ( ) ;
m_flip_fbo . read_buffer ( m_flip_fbo . color ) ;
2016-01-05 21:55:43 +01:00
}
else
{
2018-01-21 16:31:35 +01:00
LOG_WARNING ( RSX , " Flip texture was not found in cache. Uploading surface from CPU " ) ;
2016-06-26 14:47:48 +02:00
2018-01-21 16:31:35 +01:00
if ( ! m_flip_tex_color | | m_flip_tex_color . size ( ) ! = sizei { ( int ) buffer_width , ( int ) buffer_height } )
{
m_flip_tex_color . recreate ( gl : : texture : : target : : texture2D ) ;
2014-05-22 19:39:56 +02:00
2018-01-21 16:31:35 +01:00
m_flip_tex_color . config ( )
. size ( { ( int ) buffer_width , ( int ) buffer_height } )
. type ( gl : : texture : : type : : uint_8_8_8_8 )
. format ( gl : : texture : : format : : bgra ) ;
2017-02-16 19:29:56 +01:00
2018-01-21 16:31:35 +01:00
m_flip_tex_color . pixel_unpack_settings ( ) . aligment ( 1 ) . row_length ( buffer_pitch / 4 ) ;
}
if ( buffer_region . tile )
{
std : : unique_ptr < u8 [ ] > temp ( new u8 [ buffer_height * buffer_pitch ] ) ;
buffer_region . read ( temp . get ( ) , buffer_width , buffer_height , buffer_pitch ) ;
m_flip_tex_color . copy_from ( temp . get ( ) , gl : : texture : : format : : bgra , gl : : texture : : type : : uint_8_8_8_8 ) ;
}
else
{
m_flip_tex_color . copy_from ( buffer_region . ptr , gl : : texture : : format : : bgra , gl : : texture : : type : : uint_8_8_8_8 ) ;
}
m_flip_fbo . color = m_flip_tex_color ;
m_flip_fbo . read_buffer ( m_flip_fbo . color ) ;
}
// Blit source image to the screen
// Disable scissor test (affects blit)
glDisable ( GL_SCISSOR_TEST ) ;
areai screen_area = coordi ( { } , { ( int ) buffer_width , ( int ) buffer_height } ) ;
m_flip_fbo . blit ( gl : : screen , screen_area , areai ( aspect_ratio ) . flipped_vertical ( ) , gl : : buffers : : color , gl : : filter : : linear ) ;
}
2015-01-31 14:01:34 +01:00
2018-01-17 17:14:00 +01:00
if ( m_custom_ui )
{
gl : : screen . bind ( ) ;
glViewport ( 0 , 0 , m_frame - > client_width ( ) , m_frame - > client_height ( ) ) ;
m_ui_renderer . run ( m_frame - > client_width ( ) , m_frame - > client_height ( ) , 0 , * m_custom_ui . get ( ) ) ;
}
2017-05-20 13:45:02 +02:00
if ( g_cfg . video . overlay )
2016-06-12 11:05:22 +02:00
{
2016-10-11 02:55:42 +02:00
gl : : screen . bind ( ) ;
glViewport ( 0 , 0 , m_frame - > client_width ( ) , m_frame - > client_height ( ) ) ;
2017-04-04 18:14:36 +02:00
2016-10-11 02:55:42 +02:00
m_text_printer . print_text ( 0 , 0 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " draw calls: " + std : : to_string ( m_draw_calls ) ) ;
m_text_printer . print_text ( 0 , 18 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " draw call setup: " + std : : to_string ( m_begin_time ) + " us " ) ;
m_text_printer . print_text ( 0 , 36 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " vertex upload time: " + std : : to_string ( m_vertex_upload_time ) + " us " ) ;
m_text_printer . print_text ( 0 , 54 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " textures upload time: " + std : : to_string ( m_textures_upload_time ) + " us " ) ;
m_text_printer . print_text ( 0 , 72 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " draw call execution: " + std : : to_string ( m_draw_time ) + " us " ) ;
2017-09-22 22:43:01 +02:00
auto num_dirty_textures = m_gl_texture_cache . get_unreleased_textures_count ( ) ;
2017-10-21 23:12:32 +02:00
auto texture_memory_size = m_gl_texture_cache . get_texture_memory_in_use ( ) / ( 1024 * 1024 ) ;
2017-09-22 22:43:01 +02:00
m_text_printer . print_text ( 0 , 108 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " Unreleased textures: " + std : : to_string ( num_dirty_textures ) ) ;
2017-10-21 23:12:32 +02:00
m_text_printer . print_text ( 0 , 126 , m_frame - > client_width ( ) , m_frame - > client_height ( ) , " Texture memory: " + std : : to_string ( texture_memory_size ) + " M " ) ;
2016-06-12 11:05:22 +02:00
}
2016-10-11 02:55:42 +02:00
m_frame - > flip ( m_context ) ;
2017-06-30 00:20:23 +02:00
rsx : : thread : : flip ( buffer ) ;
2016-03-09 19:11:22 +01:00
2017-07-26 20:18:04 +02:00
// Cleanup
2017-09-08 16:52:13 +02:00
m_gl_texture_cache . on_frame_end ( ) ;
2017-02-16 19:29:56 +01:00
2018-02-02 08:04:55 +01:00
m_rtts . free_invalidated ( ) ;
2017-07-26 18:32:13 +02:00
m_vertex_cache - > purge ( ) ;
2017-07-26 20:18:04 +02:00
//If we are skipping the next frame, do not reset perf counters
2017-06-30 00:20:23 +02:00
if ( skip_frame ) return ;
m_draw_calls = 0 ;
m_begin_time = 0 ;
m_draw_time = 0 ;
m_vertex_upload_time = 0 ;
m_textures_upload_time = 0 ;
2014-02-16 09:56:58 +01:00
}
2015-10-09 20:04:20 +02:00
2015-10-11 22:00:51 +02:00
// Returns the current GL_TIMESTAMP value as reported by glGetInteger64v.
// The output is zero-initialized: on a GL error the driver leaves the
// destination untouched, so without this the function would return an
// indeterminate value.
u64 GLGSRender::timestamp() const
{
	GLint64 result = 0;
	glGetInteger64v(GL_TIMESTAMP, &result);
	return static_cast<u64>(result);
}
2016-02-15 10:50:14 +01:00
bool GLGSRender : : on_access_violation ( u32 address , bool is_writing )
{
2017-10-23 14:39:24 +02:00
bool can_flush = ( std : : this_thread : : get_id ( ) = = m_thread_id ) ;
2017-10-24 12:59:46 +02:00
auto result = m_gl_texture_cache . invalidate_address ( address , is_writing , can_flush ) ;
2017-10-21 23:12:32 +02:00
2017-10-27 23:32:27 +02:00
if ( ! result . violation_handled )
2017-10-21 23:12:32 +02:00
return false ;
2017-10-30 13:27:22 +01:00
{
std : : lock_guard < std : : mutex > lock ( m_sampler_mutex ) ;
m_samplers_dirty . store ( true ) ;
}
2017-10-27 23:32:27 +02:00
if ( result . num_flushable > 0 )
2017-09-08 16:52:13 +02:00
{
2017-10-27 23:32:27 +02:00
work_item & task = post_flush_request ( address , result ) ;
2017-09-08 16:52:13 +02:00
2017-10-21 23:12:32 +02:00
vm : : temporary_unlock ( ) ;
{
std : : unique_lock < std : : mutex > lock ( task . guard_mutex ) ;
task . cv . wait ( lock , [ & task ] { return task . processed ; } ) ;
2017-09-08 16:52:13 +02:00
}
2017-10-21 23:12:32 +02:00
task . received = true ;
return true ;
2017-09-08 16:52:13 +02:00
}
2017-10-21 23:12:32 +02:00
2017-10-23 14:39:24 +02:00
return true ;
2016-08-27 08:12:44 +02:00
}
2017-02-16 19:29:56 +01:00
2017-08-07 23:54:40 +02:00
void GLGSRender : : on_notify_memory_unmapped ( u32 address_base , u32 size )
{
2017-10-21 23:12:32 +02:00
//Discard all memory in that range without bothering with writeback (Force it for strict?)
2017-10-27 23:32:27 +02:00
if ( m_gl_texture_cache . invalidate_range ( address_base , size , true , true , false ) . violation_handled )
2017-10-30 13:27:22 +01:00
{
2017-08-07 23:54:40 +02:00
m_gl_texture_cache . purge_dirty ( ) ;
2017-10-30 13:27:22 +01:00
{
std : : lock_guard < std : : mutex > lock ( m_sampler_mutex ) ;
m_samplers_dirty . store ( true ) ;
}
}
2017-08-07 23:54:40 +02:00
}
2018-01-21 21:55:01 +01:00
void GLGSRender : : do_local_task ( bool /*idle*/ )
2017-02-16 19:29:56 +01:00
{
2017-10-11 00:09:04 +02:00
m_frame - > clear_wm_events ( ) ;
2018-02-02 07:25:30 +01:00
if ( ! work_queue . empty ( ) )
2017-02-16 19:29:56 +01:00
{
2018-02-03 09:37:42 +01:00
std : : lock_guard < std : : mutex > lock ( queue_guard ) ;
2018-02-02 07:25:30 +01:00
work_queue . remove_if ( [ ] ( work_item & q ) { return q . received ; } ) ;
for ( work_item & q : work_queue )
{
if ( q . processed ) continue ;
2017-03-10 14:27:38 +01:00
2018-02-02 07:25:30 +01:00
std : : unique_lock < std : : mutex > lock ( q . guard_mutex ) ;
q . result = m_gl_texture_cache . flush_all ( q . section_data ) ;
q . processed = true ;
2017-02-16 19:29:56 +01:00
2018-02-02 07:25:30 +01:00
//Notify thread waiting on this
lock . unlock ( ) ;
q . cv . notify_one ( ) ;
}
2017-02-16 19:29:56 +01:00
}
2018-02-03 09:37:42 +01:00
else if ( ! in_begin_end )
{
//This will re-engage locks and break the texture cache if another thread is waiting in access violation handler!
//Only call when there are no waiters
m_gl_texture_cache . do_update ( ) ;
}
2018-01-17 17:14:00 +01:00
2018-01-21 21:55:01 +01:00
if ( m_overlay_cleanup_requests . size ( ) )
{
m_ui_renderer . remove_temp_resources ( ) ;
m_overlay_cleanup_requests . clear ( ) ;
}
else if ( m_custom_ui )
2018-01-17 17:14:00 +01:00
{
2018-01-21 21:55:01 +01:00
if ( ! in_begin_end & & native_ui_flip_request . load ( ) )
2018-01-17 17:14:00 +01:00
{
native_ui_flip_request . store ( false ) ;
flip ( ( s32 ) current_display_buffer ) ;
}
}
2017-02-16 19:29:56 +01:00
}
2017-10-27 23:32:27 +02:00
// Appends a new flush request to work_queue under queue_guard and returns a
// reference to it. 'flush_data' is moved into the request, so the caller's
// object is left in a moved-from state.
work_item& GLGSRender::post_flush_request(u32 address, gl::texture_cache::thrashed_set& flush_data)
{
	std::lock_guard<std::mutex> queue_lock(queue_guard);

	work_queue.emplace_back();
	work_item& request = work_queue.back();

	request.section_data = std::move(flush_data);
	request.address_to_flush = address;

	return request;
}
void GLGSRender : : synchronize_buffers ( )
{
if ( flush_draw_buffers )
{
write_buffers ( ) ;
flush_draw_buffers = false ;
}
}
2017-03-29 21:27:29 +02:00
bool GLGSRender : : scaled_image_from_memory ( rsx : : blit_src_info & src , rsx : : blit_dst_info & dst , bool interpolate )
{
2017-10-30 13:27:22 +01:00
m_samplers_dirty . store ( true ) ;
2017-09-08 16:52:13 +02:00
return m_gl_texture_cache . blit ( src , dst , interpolate , m_rtts ) ;
2017-03-29 21:27:29 +02:00
}
2017-07-27 18:04:55 +02:00
2017-10-26 05:01:10 +02:00
void GLGSRender : : notify_tile_unbound ( u32 tile )
{
2017-10-28 21:17:27 +02:00
//TODO: Handle texture writeback
//u32 addr = rsx::get_address(tiles[tile].offset, tiles[tile].location);
//on_notify_memory_unmapped(addr, tiles[tile].size);
//m_rtts.invalidate_surface_address(addr, false);
2017-10-26 05:01:10 +02:00
}
2017-11-16 22:52:21 +01:00
void GLGSRender : : begin_occlusion_query ( rsx : : occlusion_query_info * query )
2017-07-27 18:04:55 +02:00
{
2017-11-16 22:52:21 +01:00
query - > result = 0 ;
glBeginQuery ( GL_ANY_SAMPLES_PASSED , ( GLuint ) query - > driver_handle ) ;
2017-07-27 18:04:55 +02:00
}
2017-11-16 22:52:21 +01:00
void GLGSRender : : end_occlusion_query ( rsx : : occlusion_query_info * query )
2017-07-27 18:04:55 +02:00
{
2017-11-16 22:52:21 +01:00
glEndQuery ( GL_ANY_SAMPLES_PASSED ) ;
2017-07-27 18:04:55 +02:00
}
2017-11-16 22:52:21 +01:00
bool GLGSRender : : check_occlusion_query_status ( rsx : : occlusion_query_info * query )
2017-07-27 18:04:55 +02:00
{
2017-11-16 22:52:21 +01:00
GLint status = GL_TRUE ;
glGetQueryObjectiv ( ( GLuint ) query - > driver_handle , GL_QUERY_RESULT_AVAILABLE , & status ) ;
2017-08-11 22:32:44 +02:00
2017-11-16 22:52:21 +01:00
return status ! = GL_FALSE ;
2017-07-27 18:04:55 +02:00
}
2017-11-16 22:52:21 +01:00
void GLGSRender : : get_occlusion_query_result ( rsx : : occlusion_query_info * query )
2017-07-27 18:04:55 +02:00
{
2017-11-16 22:52:21 +01:00
GLint result ;
glGetQueryObjectiv ( ( GLuint ) query - > driver_handle , GL_QUERY_RESULT , & result ) ;
2017-07-27 18:04:55 +02:00
2017-11-16 22:52:21 +01:00
query - > result + = result ;
2018-01-17 17:14:00 +01:00
}
void GLGSRender : : shell_do_cleanup ( )
{
2018-01-21 21:55:01 +01:00
//TODO: Key cleanup requests with UID to identify resources to remove
m_overlay_cleanup_requests . push_back ( 0 ) ;
}