#include "stdafx.h" #include "GLGSRender.h" #include "Emu/Cell/Modules/cellVideoOut.h" #include "Emu/RSX/Overlays/overlay_manager.h" #include "util/video_provider.h" LOG_CHANNEL(screenshot_log, "SCREENSHOT"); extern atomic_t g_user_asked_for_screenshot; extern atomic_t g_recording_mode; namespace gl { namespace debug { std::unique_ptr g_vis_texture; void set_vis_texture(texture* visual) { const auto target = static_cast(visual->get_target()); const auto ifmt = static_cast(visual->get_internal_format()); g_vis_texture.reset(new texture(target, visual->width(), visual->height(), 1, 1, ifmt, visual->format_class())); glCopyImageSubData(visual->id(), target, 0, 0, 0, 0, g_vis_texture->id(), target, 0, 0, 0, 0, visual->width(), visual->height(), 1); } } } gl::texture* GLGSRender::get_present_source(gl::present_surface_info* info, const rsx::avconf& avconfig) { gl::texture* image = nullptr; // Check the surface store first gl::command_context cmd = { gl_state }; const auto format_bpp = rsx::get_format_block_size_in_bytes(info->format); const auto overlap_info = m_rtts.get_merged_texture_memory_region(cmd, info->address, info->width, info->height, info->pitch, format_bpp, rsx::surface_access::transfer_read); if (!overlap_info.empty()) { const auto& section = overlap_info.back(); auto surface = gl::as_rtt(section.surface); bool viable = false; if (section.base_address >= info->address) { const auto surface_width = surface->get_surface_width(); const auto surface_height = surface->get_surface_height(); if (section.base_address == info->address) { // Check for fit or crop viable = (surface_width >= info->width && surface_height >= info->height); } else { // Check for borders and letterboxing const u32 inset_offset = section.base_address - info->address; const u32 inset_y = inset_offset / info->pitch; const u32 inset_x = (inset_offset % info->pitch) / format_bpp; const u32 full_width = surface_width + inset_x + inset_x; const u32 full_height = surface_height + inset_y + inset_y; viable = (full_width == info->width && full_height == info->height); } if (viable) { image = section.surface->get_surface(rsx::surface_access::transfer_read); std::tie(info->width, info->height) = rsx::apply_resolution_scale( std::min(surface_width, info->width), std::min(surface_height, info->height)); } } } else if (auto surface = m_gl_texture_cache.find_texture_from_dimensions(info->address, info->format); surface && surface->get_width() >= info->width && surface->get_height() >= info->height) { // Hack - this should be the first location to check for output // The render might have been done offscreen or in software and a blit used to display if (const auto tex = surface->get_raw_texture(); tex) image = tex; } if (!image) { rsx_log.warning("Flip texture was not found in cache. Uploading surface from CPU"); gl::pixel_unpack_settings unpack_settings; unpack_settings.alignment(1).row_length(info->pitch / 4); if (!m_flip_tex_color || m_flip_tex_color->size2D() != sizeu{info->width, info->height}) { m_flip_tex_color = std::make_unique(GL_TEXTURE_2D, info->width, info->height, 1, 1, GL_RGBA8); } gl::command_context cmd{ gl_state }; const auto range = utils::address_range::start_length(info->address, info->pitch * info->height); m_gl_texture_cache.invalidate_range(cmd, range, rsx::invalidation_cause::read); gl::texture::format fmt; switch (avconfig.format) { default: rsx_log.error("Unhandled video output format 0x%x", avconfig.format); [[fallthrough]]; case CELL_VIDEO_OUT_BUFFER_COLOR_FORMAT_X8R8G8B8: fmt = gl::texture::format::bgra; break; case CELL_VIDEO_OUT_BUFFER_COLOR_FORMAT_X8B8G8R8: fmt = gl::texture::format::rgba; break; } m_flip_tex_color->copy_from(vm::base(info->address), fmt, gl::texture::type::uint_8_8_8_8, unpack_settings); image = m_flip_tex_color.get(); } return image; } void GLGSRender::flip(const rsx::display_flip_info_t& info) { if (info.skip_frame) { m_frame->flip(m_context, true); rsx::thread::flip(info); return; } gl::command_context cmd{ gl_state }; u32 buffer_width = display_buffers[info.buffer].width; u32 buffer_height = display_buffers[info.buffer].height; u32 buffer_pitch = display_buffers[info.buffer].pitch; u32 av_format; const auto& avconfig = g_fxo->get(); if (!buffer_width) { buffer_width = avconfig.resolution_x; buffer_height = avconfig.resolution_y; } if (avconfig.state) { av_format = avconfig.get_compatible_gcm_format(); if (!buffer_pitch) buffer_pitch = buffer_width * avconfig.get_bpp(); const u32 video_frame_height = (avconfig.stereo_mode == stereo_render_mode_options::disabled? avconfig.resolution_y : ((avconfig.resolution_y - 30) / 2)); buffer_width = std::min(buffer_width, avconfig.resolution_x); buffer_height = std::min(buffer_height, video_frame_height); } else { av_format = CELL_GCM_TEXTURE_A8R8G8B8; if (!buffer_pitch) buffer_pitch = buffer_width * 4; } // Disable scissor test (affects blit, clear, etc) gl_state.disable(GL_SCISSOR_TEST); // Enable drawing to window backbuffer gl::screen.bind(); GLuint image_to_flip = GL_NONE, image_to_flip2 = GL_NONE; if (info.buffer < display_buffers_count && buffer_width && buffer_height) { // Find the source image gl::present_surface_info present_info; present_info.width = buffer_width; present_info.height = buffer_height; present_info.pitch = buffer_pitch; present_info.format = av_format; present_info.address = rsx::get_address(display_buffers[info.buffer].offset, CELL_GCM_LOCATION_LOCAL); const auto image_to_flip_ = get_present_source(&present_info, avconfig); image_to_flip = image_to_flip_->id(); if (avconfig.stereo_mode != stereo_render_mode_options::disabled) [[unlikely]] { const auto [unused, min_expected_height] = rsx::apply_resolution_scale(RSX_SURFACE_DIMENSION_IGNORED, buffer_height + 30); if (image_to_flip_->height() < min_expected_height) { // Get image for second eye const u32 image_offset = (buffer_height + 30) * buffer_pitch + display_buffers[info.buffer].offset; present_info.width = buffer_width; present_info.height = buffer_height; present_info.address = rsx::get_address(image_offset, CELL_GCM_LOCATION_LOCAL); image_to_flip2 = get_present_source(&present_info, avconfig)->id(); } else { // Account for possible insets const auto [unused2, scaled_buffer_height] = rsx::apply_resolution_scale(RSX_SURFACE_DIMENSION_IGNORED, buffer_height); buffer_height = std::min(image_to_flip_->height() - min_expected_height, scaled_buffer_height); } } buffer_width = present_info.width; buffer_height = present_info.height; } if (info.emu_flip) { evaluate_cpu_usage_reduction_limits(); } // Get window state const int width = m_frame->client_width(); const int height = m_frame->client_height(); // Calculate blit coordinates areai aspect_ratio; if (!g_cfg.video.stretch_to_display_area) { const sizeu csize(width, height); const auto converted = avconfig.aspect_convert_region(size2u{ buffer_width, buffer_height }, csize); aspect_ratio = static_cast(converted); } else { aspect_ratio = { 0, 0, width, height }; } if (!image_to_flip || aspect_ratio.x1 || aspect_ratio.y1) { // Clear the window background to black gl_state.clear_color(0, 0, 0, 0); gl::screen.clear(gl::buffers::color); } if (image_to_flip) { if (g_user_asked_for_screenshot || (g_recording_mode != recording_mode::stopped && m_frame->can_consume_frame())) { std::vector sshot_frame(buffer_height * buffer_width * 4); gl::pixel_pack_settings pack_settings{}; pack_settings.apply(); if (gl::get_driver_caps().ARB_dsa_supported) glGetTextureImage(image_to_flip, 0, GL_RGBA, GL_UNSIGNED_BYTE, buffer_height * buffer_width * 4, sshot_frame.data()); else glGetTextureImageEXT(image_to_flip, GL_TEXTURE_2D, 0, GL_RGBA, GL_UNSIGNED_BYTE, sshot_frame.data()); if (GLenum err = glGetError(); err != GL_NO_ERROR) { screenshot_log.error("Failed to capture image: 0x%x", err); } else if (g_user_asked_for_screenshot.exchange(false)) { m_frame->take_screenshot(std::move(sshot_frame), buffer_width, buffer_height, false); } else { m_frame->present_frame(sshot_frame, buffer_width, buffer_height, false); } } const areai screen_area = coordi({}, { static_cast(buffer_width), static_cast(buffer_height) }); const bool use_full_rgb_range_output = g_cfg.video.full_rgb_range_output.get(); // TODO: Implement FSR for OpenGL and remove this fallback to bilinear const gl::filter filter = g_cfg.video.output_scaling == output_scaling_mode::nearest ? gl::filter::nearest : gl::filter::linear; if (use_full_rgb_range_output && rsx::fcmp(avconfig.gamma, 1.f) && avconfig.stereo_mode == stereo_render_mode_options::disabled) { // Blit source image to the screen m_flip_fbo.recreate(); m_flip_fbo.bind(); m_flip_fbo.color = image_to_flip; m_flip_fbo.read_buffer(m_flip_fbo.color); m_flip_fbo.draw_buffer(m_flip_fbo.color); m_flip_fbo.blit(gl::screen, screen_area, aspect_ratio.flipped_vertical(), gl::buffers::color, filter); } else { const f32 gamma = avconfig.gamma; const bool limited_range = !use_full_rgb_range_output; const rsx::simple_array images{ image_to_flip, image_to_flip2 }; gl::screen.bind(); m_video_output_pass.run(cmd, areau(aspect_ratio), images, gamma, limited_range, avconfig.stereo_mode, filter); } } if (m_overlay_manager) { if (m_overlay_manager->has_dirty()) { m_overlay_manager->lock(); std::vector uids_to_dispose; uids_to_dispose.reserve(m_overlay_manager->get_dirty().size()); for (const auto& view : m_overlay_manager->get_dirty()) { m_ui_renderer.remove_temp_resources(view->uid); uids_to_dispose.push_back(view->uid); } m_overlay_manager->unlock(); m_overlay_manager->dispose(uids_to_dispose); } if (m_overlay_manager->has_visible()) { gl::screen.bind(); // Lock to avoid modification during run-update chain std::lock_guard lock(*m_overlay_manager); for (const auto& view : m_overlay_manager->get_views()) { m_ui_renderer.run(cmd, areau(aspect_ratio), 0, *view.get()); } } } if (g_cfg.video.overlay && gl::get_driver_caps().ARB_shader_draw_parameters_supported) { if (!m_text_printer.is_enabled()) { m_text_printer.init(); m_text_printer.set_enabled(true); } // Disable depth test gl_state.depth_func(GL_ALWAYS); gl::screen.bind(); glViewport(0, 0, width, height); m_text_printer.set_scale(m_frame->client_device_pixel_ratio()); int y_loc = 0; const auto println = [&](const std::string& text) { m_text_printer.print_text(cmd, 4, y_loc, width, height, text); y_loc += 16; }; println(fmt::format("RSX Load: %3d%%", get_load())); println(fmt::format("draw calls: %16d", info.stats.draw_calls)); println(fmt::format("draw call setup: %11dus", info.stats.setup_time)); println(fmt::format("vertex upload time: %8dus", info.stats.vertex_upload_time)); println(fmt::format("textures upload time: %6dus", info.stats.textures_upload_time)); println(fmt::format("draw call execution: %7dus", info.stats.draw_exec_time)); const auto num_dirty_textures = m_gl_texture_cache.get_unreleased_textures_count(); const auto texture_memory_size = m_gl_texture_cache.get_texture_memory_in_use() / (1024 * 1024); const auto num_flushes = m_gl_texture_cache.get_num_flush_requests(); const auto num_mispredict = m_gl_texture_cache.get_num_cache_mispredictions(); const auto num_speculate = m_gl_texture_cache.get_num_cache_speculative_writes(); const auto num_misses = m_gl_texture_cache.get_num_cache_misses(); const auto num_unavoidable = m_gl_texture_cache.get_num_unavoidable_hard_faults(); const auto cache_miss_ratio = static_cast(ceil(m_gl_texture_cache.get_cache_miss_ratio() * 100)); const auto num_texture_upload = m_gl_texture_cache.get_texture_upload_calls_this_frame(); const auto num_texture_upload_miss = m_gl_texture_cache.get_texture_upload_misses_this_frame(); const auto texture_upload_miss_ratio = m_gl_texture_cache.get_texture_upload_miss_percentage(); const auto texture_copies_ellided = m_gl_texture_cache.get_texture_copies_ellided_this_frame(); println(fmt::format("Unreleased textures: %7d", num_dirty_textures)); println(fmt::format("Texture memory: %12dM", texture_memory_size)); println(fmt::format("Flush requests: %12d = %2d (%3d%%) hard faults, %2d unavoidable, %2d misprediction(s), %2d speculation(s)", num_flushes, num_misses, cache_miss_ratio, num_unavoidable, num_mispredict, num_speculate)); println(fmt::format("Texture uploads: %11u (%u from CPU - %02u%%, %u copies avoided)", num_texture_upload, num_texture_upload_miss, texture_upload_miss_ratio, texture_copies_ellided)); const auto vertex_cache_hit_count = (info.stats.vertex_cache_request_count - info.stats.vertex_cache_miss_count); const auto vertex_cache_hit_ratio = info.stats.vertex_cache_request_count ? (vertex_cache_hit_count * 100) / info.stats.vertex_cache_request_count : 0; println(fmt::format("Vertex cache hits: %9u/%u (%u%%)", vertex_cache_hit_count, info.stats.vertex_cache_request_count, vertex_cache_hit_ratio)); } if (gl::debug::g_vis_texture) { // Optionally renders a single debug texture to framebuffer. // Only programmatic access provided at the moment. // TODO: Migrate to use overlay system. (kd-11) gl::fbo m_vis_buffer; m_vis_buffer.create(); m_vis_buffer.bind(); m_vis_buffer.color = gl::debug::g_vis_texture->id(); m_vis_buffer.read_buffer(m_vis_buffer.color); m_vis_buffer.draw_buffer(m_vis_buffer.color); const u32 vis_width = 320; const u32 vis_height = 240; areai display_view = areai(aspect_ratio).flipped_vertical(); display_view.x1 = display_view.x2 - vis_width; display_view.y1 = vis_height; // Blit const auto src_region = areau{ 0u, 0u, gl::debug::g_vis_texture->width(), gl::debug::g_vis_texture->height() }; m_vis_buffer.blit(gl::screen, static_cast(src_region), display_view, gl::buffers::color, gl::filter::linear); m_vis_buffer.remove(); } m_frame->flip(m_context); rsx::thread::flip(info); // Cleanup m_gl_texture_cache.on_frame_end(); m_vertex_cache->purge(); auto removed_textures = m_rtts.trim(cmd); m_framebuffer_cache.remove_if([&](auto& fbo) { if (fbo.unused_check_count() >= 2) return true; // Remove if stale if (fbo.references_any(removed_textures)) return true; // Remove if any of the attachments is invalid return false; }); if (m_draw_fbo && !m_graphics_state.test(rsx::rtt_config_dirty)) { // Always restore the active framebuffer m_draw_fbo->bind(); set_viewport(); set_scissor(m_graphics_state & rsx::pipeline_state::scissor_setup_clipped); } }