#pragma once #include "stdafx.h" #include #include #include #include #include #include #include #include #include "Utilities/mutex.h" #include "Emu/System.h" #include "GLRenderTargets.h" #include "../Common/TextureUtils.h" #include "../Common/texture_cache.h" #include "../../Memory/vm.h" #include "../rsx_utils.h" class GLGSRender; namespace gl { class blitter; extern GLenum get_sized_internal_format(u32); extern blitter *g_hw_blitter; class blitter { fbo blit_src; fbo blit_dst; public: void init() { blit_src.create(); blit_dst.create(); } void destroy() { blit_dst.remove(); blit_src.remove(); } u32 scale_image(u32 src, u32 dst, const areai src_rect, const areai dst_rect, bool linear_interpolation, bool is_depth_copy) { s32 old_fbo = 0; glGetIntegerv(GL_FRAMEBUFFER_BINDING, &old_fbo); u32 dst_tex = dst; filter interp = linear_interpolation ? filter::linear : filter::nearest; GLenum attachment = is_depth_copy ? GL_DEPTH_ATTACHMENT : GL_COLOR_ATTACHMENT0; blit_src.bind(); glFramebufferTexture2D(GL_FRAMEBUFFER, attachment, GL_TEXTURE_2D, src, 0); blit_src.check(); blit_dst.bind(); glFramebufferTexture2D(GL_FRAMEBUFFER, attachment, GL_TEXTURE_2D, dst_tex, 0); blit_dst.check(); GLboolean scissor_test_enabled = glIsEnabled(GL_SCISSOR_TEST); if (scissor_test_enabled) glDisable(GL_SCISSOR_TEST); blit_src.blit(blit_dst, src_rect, dst_rect, is_depth_copy ? buffers::depth : buffers::color, interp); if (scissor_test_enabled) glEnable(GL_SCISSOR_TEST); glBindFramebuffer(GL_FRAMEBUFFER, old_fbo); return dst_tex; } }; class cached_texture_section : public rsx::cached_texture_section { private: fence m_fence; u32 pbo_id = 0; u32 pbo_size = 0; u32 vram_texture = 0; u32 scaled_texture = 0; bool copied = false; bool flushed = false; bool is_depth = false; texture::format format = texture::format::rgba; texture::type type = texture::type::ubyte; bool pack_unpack_swap_bytes = false; u8 get_pixel_size(texture::format fmt_, texture::type type_) { u8 size = 1; switch (type_) { case texture::type::ubyte: case texture::type::sbyte: break; case texture::type::ushort: case texture::type::sshort: case texture::type::f16: size = 2; break; case texture::type::ushort_5_6_5: case texture::type::ushort_5_6_5_rev: case texture::type::ushort_4_4_4_4: case texture::type::ushort_4_4_4_4_rev: case texture::type::ushort_5_5_5_1: case texture::type::ushort_1_5_5_5_rev: return 2; case texture::type::uint_8_8_8_8: case texture::type::uint_8_8_8_8_rev: case texture::type::uint_10_10_10_2: case texture::type::uint_2_10_10_10_rev: case texture::type::uint_24_8: return 4; case texture::type::f32: case texture::type::sint: case texture::type::uint: size = 4; break; } switch (fmt_) { case texture::format::red: case texture::format::r: break; case texture::format::rg: size *= 2; break; case texture::format::rgb: case texture::format::bgr: size *= 3; break; case texture::format::rgba: case texture::format::bgra: size *= 4; break; //Depth formats.. case texture::format::depth: size = 2; break; case texture::format::depth_stencil: size = 4; break; default: LOG_ERROR(RSX, "Unsupported rtt format %d", (GLenum)fmt_); size = 4; } return size; } void init_buffer() { if (pbo_id) { glDeleteBuffers(1, &pbo_id); pbo_id = 0; pbo_size = 0; } glGenBuffers(1, &pbo_id); const u32 buffer_size = align(cpu_address_range, 4096); glBindBuffer(GL_PIXEL_PACK_BUFFER, pbo_id); glBufferStorage(GL_PIXEL_PACK_BUFFER, buffer_size, nullptr, GL_MAP_READ_BIT); pbo_size = buffer_size; } public: void reset(const u32 base, const u32 size, const bool flushable=false) { rsx::protection_policy policy = g_cfg.video.strict_rendering_mode ? rsx::protection_policy::protect_policy_full_range : rsx::protection_policy::protect_policy_one_page; rsx::buffered_section::reset(base, size, policy); if (flushable) init_buffer(); flushed = false; copied = false; is_depth = false; vram_texture = 0; } void create(const u16 w, const u16 h, const u16 depth, const u16 mipmaps, void*, gl::texture* image, const u32 rsx_pitch, bool read_only, gl::texture::format gl_format, gl::texture::type gl_type, bool swap_bytes) { if (!read_only && pbo_id == 0) init_buffer(); flushed = false; copied = false; is_depth = false; this->width = w; this->height = h; this->rsx_pitch = rsx_pitch; this->depth = depth; this->mipmaps = mipmaps; vram_texture = image->id(); set_format(gl_format, gl_type, swap_bytes); } void create_read_only(const u32 id, const u32 width, const u32 height, const u32 depth, const u32 mipmaps) { //Only to be used for ro memory, we dont care about most members, just dimensions and the vram texture handle this->width = width; this->height = height; this->depth = depth; this->mipmaps = mipmaps; vram_texture = id; rsx_pitch = 0; real_pitch = 0; } void set_dimensions(u32 width, u32 height, u32 depth, u32 pitch) { this->width = width; this->height = height; rsx_pitch = pitch; real_pitch = width * get_pixel_size(format, type); } void set_format(const texture::format gl_format, const texture::type gl_type, const bool swap_bytes) { format = gl_format; type = gl_type; pack_unpack_swap_bytes = swap_bytes; real_pitch = width * get_pixel_size(format, type); } void set_depth_flag(bool is_depth_fmt) { is_depth = is_depth_fmt; } void set_source(gl::texture &source) { vram_texture = source.id(); } void copy_texture(bool=false) { if (!glIsTexture(vram_texture)) { LOG_ERROR(RSX, "Attempted to download rtt texture, but texture handle was invalid! (0x%X)", vram_texture); return; } if (real_pitch != rsx_pitch || rsx::get_resolution_scale_percent() != 100) { const u32 real_width = (rsx_pitch * width) / real_pitch; if (scaled_texture == 0) { GLenum ifmt = 0; glBindTexture(GL_TEXTURE_2D, vram_texture); glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_INTERNAL_FORMAT, (GLint*)&ifmt); //Get expected texture dimensions.. glGenTextures(1, &scaled_texture); glBindTexture(GL_TEXTURE_2D, scaled_texture); glTexStorage2D(GL_TEXTURE_2D, 1, ifmt, real_width, height); } areai src_area = { 0, 0, 0, 0 }; const areai dst_area = {0, 0, static_cast(real_width), height}; glBindTexture(GL_TEXTURE_2D, vram_texture); glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_WIDTH, &src_area.x2); glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_HEIGHT, &src_area.y2); g_hw_blitter->scale_image(vram_texture, scaled_texture, src_area, dst_area, true, is_depth); } glPixelStorei(GL_PACK_SWAP_BYTES, pack_unpack_swap_bytes); glBindBuffer(GL_PIXEL_PACK_BUFFER, pbo_id); const GLuint target_texture = (scaled_texture == 0) ? vram_texture : scaled_texture; if (get_driver_caps().EXT_dsa_supported) glGetTextureImageEXT(target_texture, GL_TEXTURE_2D, 0, (GLenum)format, (GLenum)type, nullptr); else glGetTextureImage(target_texture, 0, (GLenum)format, (GLenum)type, pbo_size, nullptr); glBindBuffer(GL_PIXEL_PACK_BUFFER, 0); m_fence.reset(); copied = true; } void fill_texture(gl::texture* tex) { if (!copied) { //LOG_WARNING(RSX, "Request to fill texture rejected because contents were not read"); return; } u32 min_width = std::min((u16)tex->width(), width); u32 min_height = std::min((u16)tex->height(), height); tex->bind(); glPixelStorei(GL_UNPACK_SWAP_BYTES, pack_unpack_swap_bytes); glBindBuffer(GL_PIXEL_UNPACK_BUFFER, pbo_id); glTexSubImage2D((GLenum)tex->get_target(), 0, 0, 0, min_width, min_height, (GLenum)format, (GLenum)type, nullptr); glBindBuffer(GL_PIXEL_UNPACK_BUFFER, 0); } bool flush() { if (!copied) { LOG_WARNING(RSX, "Cache miss at address 0x%X. This is gonna hurt...", cpu_address_base); copy_texture(); if (!copied) { LOG_WARNING(RSX, "Nothing to copy; Setting section to readable and moving on..."); protect(utils::protection::ro); return false; } } protect(utils::protection::rw); m_fence.wait_for_signal(); flushed = true; glBindBuffer(GL_PIXEL_PACK_BUFFER, pbo_id); void *data = glMapBufferRange(GL_PIXEL_PACK_BUFFER, 0, pbo_size, GL_MAP_READ_BIT); u8 *dst = vm::ps3::_ptr(cpu_address_base); //throw if map failed since we'll segfault anyway verify(HERE), data != nullptr; if (real_pitch >= rsx_pitch || scaled_texture != 0) { memcpy(dst, data, cpu_address_range); } else { //TODO: Use compression hint from the gcm tile information //TODO: Fall back to bilinear filtering if samples > 2 const u8 pixel_size = get_pixel_size(format, type); const u8 samples = rsx_pitch / real_pitch; rsx::scale_image_nearest(dst, const_cast(data), width, height, rsx_pitch, real_pitch, pixel_size, samples); } glUnmapBuffer(GL_PIXEL_PACK_BUFFER); glBindBuffer(GL_PIXEL_PACK_BUFFER, 0); return true; } void destroy() { if (!locked && pbo_id == 0 && vram_texture == 0 && m_fence.is_empty()) //Already destroyed return; if (locked) unprotect(); if (pbo_id == 0) { //Read-only texture, destroy texture memory glDeleteTextures(1, &vram_texture); vram_texture = 0; } else { //Destroy pbo cache since vram texture is managed elsewhere glDeleteBuffers(1, &pbo_id); pbo_id = 0; pbo_size = 0; if (scaled_texture) { glDeleteTextures(1, &scaled_texture); scaled_texture = 0; } } if (!m_fence.is_empty()) m_fence.destroy(); } texture::format get_format() const { return format; } bool exists() const { return vram_texture != 0; } bool is_flushable() const { return (locked && pbo_id != 0); } bool is_flushed() const { return flushed; } bool is_synchronized() const { return copied; } void set_flushed(const bool state) { flushed = state; } bool is_empty() const { return vram_texture == 0; } u32 get_raw_view() const { return vram_texture; } u32 get_raw_texture() const { return vram_texture; } bool is_depth_texture() const { return is_depth; } bool has_compatible_format(gl::texture* tex) const { GLenum fmt; glBindTexture(GL_TEXTURE_2D, vram_texture); glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_INTERNAL_FORMAT, (GLint*)&fmt); if (auto as_rtt = dynamic_cast(tex)) { return (GLenum)as_rtt->get_compatible_internal_format() == fmt; } return (gl::texture::format)fmt == tex->get_internal_format(); } }; class texture_cache : public rsx::texture_cache { private: blitter m_hw_blitter; std::vector m_temporary_surfaces; cached_texture_section& create_texture(u32 id, u32 texaddr, u32 texsize, u32 w, u32 h, u32 depth, u32 mipmaps) { cached_texture_section& tex = find_cached_texture(texaddr, texsize, true, w, h, depth); tex.reset(texaddr, texsize, false); tex.create_read_only(id, w, h, depth, mipmaps); read_only_range = tex.get_min_max(read_only_range); return tex; } void clear() { for (auto &address_range : m_cache) { auto &range_data = address_range.second; for (auto &tex : range_data.data) { tex.destroy(); } range_data.data.resize(0); } clear_temporary_subresources(); m_unreleased_texture_objects = 0; } void clear_temporary_subresources() { for (u32 &id : m_temporary_surfaces) { glDeleteTextures(1, &id); } m_temporary_surfaces.resize(0); } u32 create_temporary_subresource(u32 src_id, GLenum sized_internal_fmt, u16 x, u16 y, u16 width, u16 height) { u32 dst_id = 0; GLenum ifmt; glBindTexture(GL_TEXTURE_2D, src_id); glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_INTERNAL_FORMAT, (GLint*)&ifmt); switch (ifmt) { case GL_DEPTH_COMPONENT16: case GL_DEPTH_COMPONENT24: case GL_DEPTH24_STENCIL8: sized_internal_fmt = ifmt; break; } glGenTextures(1, &dst_id); glBindTexture(GL_TEXTURE_2D, dst_id); glTexStorage2D(GL_TEXTURE_2D, 1, sized_internal_fmt, width, height); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_LINEAR); //Empty GL_ERROR glGetError(); glCopyImageSubData(src_id, GL_TEXTURE_2D, 0, x, y, 0, dst_id, GL_TEXTURE_2D, 0, 0, 0, 0, width, height, 1); m_temporary_surfaces.push_back(dst_id); //Check for error if (GLenum err = glGetError()) { LOG_WARNING(RSX, "Failed to copy image subresource with GL error 0x%X", err); return 0; } return dst_id; } protected: void free_texture_section(cached_texture_section& tex) override { tex.destroy(); } u32 create_temporary_subresource_view(void*&, u32* src, u32 gcm_format, u16 x, u16 y, u16 w, u16 h) override { const GLenum ifmt = gl::get_sized_internal_format(gcm_format); return create_temporary_subresource(*src, ifmt, x, y, w, h); } u32 create_temporary_subresource_view(void*&, gl::texture* src, u32 gcm_format, u16 x, u16 y, u16 w, u16 h) override { if (auto as_rtt = dynamic_cast(src)) { return create_temporary_subresource(src->id(), (GLenum)as_rtt->get_compatible_internal_format(), x, y, w, h); } else { const GLenum ifmt = gl::get_sized_internal_format(gcm_format); return create_temporary_subresource(src->id(), ifmt, x, y, w, h); } } cached_texture_section* create_new_texture(void*&, u32 rsx_address, u32 rsx_size, u16 width, u16 height, u16 depth, u16 mipmaps, const u32 gcm_format, const rsx::texture_upload_context context, const rsx::texture_dimension_extended type, const rsx::texture_create_flags flags, std::pair, std::array>& remap_vector) override { u32 vram_texture = gl::create_texture(gcm_format, width, height, depth, mipmaps, type); bool depth_flag = false; switch (gcm_format) { case CELL_GCM_TEXTURE_DEPTH24_D8: case CELL_GCM_TEXTURE_DEPTH16: depth_flag = true; break; } if (flags == rsx::texture_create_flags::swapped_native_component_order) { glBindTexture(GL_TEXTURE_2D, vram_texture); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_R, GL_ALPHA); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_G, GL_RED); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_B, GL_GREEN); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_A, GL_BLUE); } auto& cached = create_texture(vram_texture, rsx_address, rsx_size, width, height, depth, mipmaps); cached.set_dirty(false); cached.set_depth_flag(depth_flag); cached.set_view_flags(flags); cached.set_context(context); //Its not necessary to lock blit dst textures as they are just reused as necessary if (context != rsx::texture_upload_context::blit_engine_dst || g_cfg.video.strict_rendering_mode) cached.protect(utils::protection::ro); return &cached; } cached_texture_section* upload_image_from_cpu(void*&, u32 rsx_address, u16 width, u16 height, u16 depth, u16 mipmaps, u16 pitch, const u32 gcm_format, const rsx::texture_upload_context context, std::vector& subresource_layout, const rsx::texture_dimension_extended type, const bool swizzled, std::pair, std::array>& remap_vector) override { void* unused = nullptr; auto section = create_new_texture(unused, rsx_address, pitch * height, width, height, depth, mipmaps, gcm_format, context, type, rsx::texture_create_flags::default_component_order, remap_vector); //Swizzling is ignored for blit engine copy and emulated using remapping bool input_swizzled = (context == rsx::texture_upload_context::blit_engine_src)? false : swizzled; gl::upload_texture(section->get_raw_texture(), rsx_address, gcm_format, width, height, depth, mipmaps, input_swizzled, type, subresource_layout, remap_vector, false); return section; } void enforce_surface_creation_type(cached_texture_section& section, const rsx::texture_create_flags flags) override { if (flags == section.get_view_flags()) return; if (flags == rsx::texture_create_flags::swapped_native_component_order) { glBindTexture(GL_TEXTURE_2D, section.get_raw_texture()); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_R, GL_ALPHA); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_G, GL_RED); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_B, GL_GREEN); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_SWIZZLE_A, GL_BLUE); } section.set_view_flags(flags); } void insert_texture_barrier() override { auto &caps = gl::get_driver_caps(); if (caps.ARB_texture_barrier_supported) glTextureBarrier(); else if (caps.NV_texture_barrier_supported) glTextureBarrierNV(); } public: texture_cache() {} ~texture_cache() {} void initialize() { m_hw_blitter.init(); g_hw_blitter = &m_hw_blitter; } void destroy() override { clear(); g_hw_blitter = nullptr; m_hw_blitter.destroy(); } bool is_depth_texture(const u32 rsx_address, const u32 rsx_size) override { reader_lock lock(m_cache_mutex); auto found = m_cache.find(get_block_address(rsx_address)); if (found == m_cache.end()) return false; if (found->second.valid_count == 0) return false; for (auto& tex : found->second.data) { if (tex.is_dirty()) continue; if (!tex.overlaps(rsx_address, true)) continue; if ((rsx_address + rsx_size - tex.get_section_base()) <= tex.get_section_size()) return tex.is_depth_texture(); } return false; } void on_frame_end() override { if (m_unreleased_texture_objects >= m_max_zombie_objects) { purge_dirty(); } clear_temporary_subresources(); } bool blit(rsx::blit_src_info& src, rsx::blit_dst_info& dst, bool linear_interpolate, gl_render_targets& m_rtts) { void* unused = nullptr; return upload_scaled_image(src, dst, linear_interpolate, unused, m_rtts, m_hw_blitter); } template void upload_and_bind_texture(int index, GLenum target, RsxTextureType &tex, gl_render_targets &m_rtts) { glActiveTexture(GL_TEXTURE0 + index); void* unused = nullptr; auto id = upload_texture(unused, tex, m_rtts); glBindTexture(target, id); } }; }