#include "stdafx.h"

#include "Utilities/mutex.h"
#include "VKRenderPass.h"

namespace vk
{
	// Guards every access to g_renderpass_cache.
	shared_mutex g_renderpass_cache_mutex;

	// Maps an encoded renderpass key (see the bit layout below) to the render pass created for it.
	std::unordered_map<u64, VkRenderPass> g_renderpass_cache;

	namespace
	{
		// Renderpass key bit layout:
		//   bits  0-7   color format (low 8 bits of the VkFormat value)
		//   bits  8-15  depth format (low 8 bits of the VkFormat value)
		//   bits 16-21  sample count (VkSampleCountFlagBits value)
		//   bits 22-36  attachment layouts, 3 bits each, up to 5 entries in attachment order
		constexpr u64 format_mask        = 0xFF;
		constexpr u64 depth_format_shift = 8;
		constexpr u64 sample_count_shift = 16;
		constexpr u64 sample_count_mask  = 0x3F;
		constexpr u64 layout_shift       = 22;
		constexpr u64 layout_bits        = 3;
		constexpr u64 layout_entry_mask  = 0x7;
		constexpr int max_layout_entries = 5;
		constexpr u64 all_layouts_mask   = (0x7FFFull << layout_shift);

		// Returns true when the format code is one of the depth/stencil formats this encoder recognizes.
		bool is_depth_format_code(u64 format_code)
		{
			switch (format_code)
			{
			case VK_FORMAT_D16_UNORM:
			case VK_FORMAT_D24_UNORM_S8_UINT:
			case VK_FORMAT_D32_SFLOAT_S8_UINT:
				return true;
			default:
				return false;
			}
		}

		// Packs the current layout of every image into the layout field of a key, in iteration order.
		// Throws if an image is in a layout other than the three attachment-capable ones handled here.
		// The decoder in get_renderpass reads at most 5 entries; anything past that is encoded above
		// the bits it inspects.
		// NOTE(review): element type restored as vk::image* - confirm against VKRenderPass.h.
		u64 encode_layouts(const std::vector<vk::image*>& images)
		{
			u64 bits = 0;
			u64 offset = layout_shift;

			for (const auto& surface : images)
			{
				switch (const auto layout = surface->current_layout)
				{
				case VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL:
				case VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL:
				case VK_IMAGE_LAYOUT_GENERAL:
					bits |= (u64(layout) << offset);
					offset += layout_bits;
					break;
				default:
					fmt::throw_exception("Unsupported image layout 0x%x", static_cast<u32>(layout));
				}
			}

			return bits;
		}
	}

	// Builds a full renderpass key from a set of attachments.
	// Formats of all images are OR-ed into the color/depth format fields, the sample count is taken
	// from the first image, and each image contributes one layout entry.
	// Throws if images is empty or if any image is in an unsupported layout.
	u64 get_renderpass_key(const std::vector<vk::image*>& images)
	{
		if (images.empty())
		{
			// The sample count is read from the first image, so there is nothing valid to encode
			fmt::throw_exception("Cannot build a renderpass key from an empty image list");
		}

		u64 key = 0;

		for (const auto& surface : images)
		{
			const u64 format_code = u64(surface->format()) & format_mask;
			key |= is_depth_format_code(format_code) ? (format_code << depth_format_shift) : format_code;
		}

		key |= encode_layouts(images);
		key |= u64(images.front()->samples()) << sample_count_shift;
		return key;
	}

	// Partial update: keeps the format and sample fields of previous_key and re-encodes only the
	// layout field from the images' current layouts. Assumes the images are otherwise compatible
	// with previous_key. Throws if any image is in an unsupported layout.
	u64 get_renderpass_key(const std::vector<vk::image*>& images, u64 previous_key)
	{
		return (previous_key & ~all_layouts_mask) | encode_layouts(images);
	}

	// Builds a key for a single attachment of the given format with the sample field set to 1.
	// Recognized depth formats get a DEPTH_STENCIL_ATTACHMENT_OPTIMAL layout entry; every other
	// format is treated as color and gets COLOR_ATTACHMENT_OPTIMAL.
	u64 get_renderpass_key(VkFormat surface_format)
	{
		u64 key = (1ull << sample_count_shift);

		if (is_depth_format_code(u64(surface_format)))
		{
			key |= (u64(surface_format) << depth_format_shift);
			key |= (u64(VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL) << layout_shift);
		}
		else
		{
			key |= u64(surface_format);
			key |= (u64(VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL) << layout_shift);
		}

		return key;
	}

	// Returns the render pass for renderpass_key, creating and caching it on first use.
	// The key is decoded into a sample count, color/depth formats and a list of attachment layouts;
	// when a depth format is present the last layout entry belongs to the depth attachment.
	// Throws if the key carries a depth format but no layout entries.
	VkRenderPass get_renderpass(VkDevice dev, u64 renderpass_key)
	{
		// 99.999% of checks will go through this block once on-disk shader cache has loaded
		{
			reader_lock lock(g_renderpass_cache_mutex);

			const auto found = g_renderpass_cache.find(renderpass_key);
			if (found != g_renderpass_cache.end())
			{
				return found->second;
			}
		}

		std::lock_guard lock(g_renderpass_cache_mutex);

		// Check again; the entry may have been inserted between releasing the reader lock and taking this one
		const auto found = g_renderpass_cache.find(renderpass_key);
		if (found != g_renderpass_cache.end())
		{
			return found->second;
		}

		// Decode
		const auto samples = static_cast<VkSampleCountFlagBits>((renderpass_key >> sample_count_shift) & sample_count_mask);
		const auto color_format = static_cast<VkFormat>(renderpass_key & format_mask);
		const auto depth_format = static_cast<VkFormat>((renderpass_key >> depth_format_shift) & format_mask);

		std::vector<VkImageLayout> rtv_layouts;
		rtv_layouts.reserve(max_layout_entries);

		u64 layout_offset = layout_shift;
		for (int n = 0; n < max_layout_entries; ++n)
		{
			const auto layout = static_cast<VkImageLayout>((renderpass_key >> layout_offset) & layout_entry_mask);
			layout_offset += layout_bits;

			if (layout == VK_IMAGE_LAYOUT_UNDEFINED)
			{
				// A zero entry terminates the list
				break;
			}

			rtv_layouts.push_back(layout);
		}

		VkImageLayout dsv_layout = VK_IMAGE_LAYOUT_UNDEFINED;
		if (depth_format != VK_FORMAT_UNDEFINED)
		{
			if (rtv_layouts.empty())
			{
				fmt::throw_exception("Renderpass key has a depth format but no attachment layouts");
			}

			// The depth attachment's layout is always the last encoded entry
			dsv_layout = rtv_layouts.back();
			rtv_layouts.pop_back();
		}

		std::vector<VkAttachmentDescription> attachments;
		std::vector<VkAttachmentReference> attachment_references;
		attachments.reserve(rtv_layouts.size() + 1);
		attachment_references.reserve(rtv_layouts.size() + 1);

		u32 attachment_count = 0;
		for (const auto& layout : rtv_layouts)
		{
			VkAttachmentDescription color_attachment_description = {};
			color_attachment_description.format = color_format;
			color_attachment_description.samples = samples;
			color_attachment_description.loadOp = VK_ATTACHMENT_LOAD_OP_LOAD;
			color_attachment_description.storeOp = VK_ATTACHMENT_STORE_OP_STORE;
			color_attachment_description.stencilLoadOp = VK_ATTACHMENT_LOAD_OP_DONT_CARE;
			color_attachment_description.stencilStoreOp = VK_ATTACHMENT_STORE_OP_DONT_CARE;
			color_attachment_description.initialLayout = layout;
			color_attachment_description.finalLayout = layout;

			attachments.push_back(color_attachment_description);
			attachment_references.push_back({ attachment_count++, layout });
		}

		if (depth_format != VK_FORMAT_UNDEFINED)
		{
			VkAttachmentDescription depth_attachment_description = {};
			depth_attachment_description.format = depth_format;
			depth_attachment_description.samples = samples;
			depth_attachment_description.loadOp = VK_ATTACHMENT_LOAD_OP_LOAD;
			depth_attachment_description.storeOp = VK_ATTACHMENT_STORE_OP_STORE;
			depth_attachment_description.stencilLoadOp = VK_ATTACHMENT_LOAD_OP_LOAD;
			depth_attachment_description.stencilStoreOp = VK_ATTACHMENT_STORE_OP_STORE;
			depth_attachment_description.initialLayout = dsv_layout;
			depth_attachment_description.finalLayout = dsv_layout;

			// The depth reference goes last; attachment_count keeps counting color attachments only
			attachments.push_back(depth_attachment_description);
			attachment_references.push_back({ attachment_count, dsv_layout });
		}

		// Pointers into attachment_references are taken only after the vector is fully populated
		VkSubpassDescription subpass = {};
		subpass.pipelineBindPoint = VK_PIPELINE_BIND_POINT_GRAPHICS;
		subpass.colorAttachmentCount = attachment_count;
		subpass.pColorAttachments = attachment_count ? attachment_references.data() : nullptr;
		subpass.pDepthStencilAttachment = (depth_format != VK_FORMAT_UNDEFINED) ? &attachment_references.back() : nullptr;

		VkRenderPassCreateInfo rp_info = {};
		rp_info.sType = VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO;
		rp_info.attachmentCount = static_cast<u32>(attachments.size());
		rp_info.pAttachments = attachments.data();
		rp_info.subpassCount = 1;
		rp_info.pSubpasses = &subpass;
		rp_info.pDependencies = nullptr;
		rp_info.dependencyCount = 0;

		VkRenderPass result;
		CHECK_RESULT(vkCreateRenderPass(dev, &rp_info, nullptr, &result));

		g_renderpass_cache.emplace(renderpass_key, result);
		return result;
	}

	// Destroys every cached render pass on dev and empties the cache.
	// Takes the cache mutex exclusively, like the insertion path in get_renderpass.
	void clear_renderpass_cache(VkDevice dev)
	{
		std::lock_guard lock(g_renderpass_cache_mutex);

		for (const auto& renderpass : g_renderpass_cache)
		{
			vkDestroyRenderPass(dev, renderpass.second, nullptr);
		}

		g_renderpass_cache.clear();
	}
}