Browse Source
vk_renderpass_cache: Initial implementation
vk_renderpass_cache: Initial implementation
The renderpass cache is used to avoid creating renderpasses on each draw. The hashed structure is not currently optimized.nce_cpp
3 changed files with 199 additions and 0 deletions
-
2src/video_core/CMakeLists.txt
-
100src/video_core/renderer_vulkan/vk_renderpass_cache.cpp
-
97src/video_core/renderer_vulkan/vk_renderpass_cache.h
@ -0,0 +1,100 @@ |
|||||
|
// Copyright 2019 yuzu Emulator Project
|
||||
|
// Licensed under GPLv2 or any later version
|
||||
|
// Refer to the license.txt file included.
|
||||
|
|
||||
|
#include <memory>
|
||||
|
#include <vector>
|
||||
|
|
||||
|
#include "video_core/engines/maxwell_3d.h"
|
||||
|
#include "video_core/renderer_vulkan/declarations.h"
|
||||
|
#include "video_core/renderer_vulkan/maxwell_to_vk.h"
|
||||
|
#include "video_core/renderer_vulkan/vk_device.h"
|
||||
|
#include "video_core/renderer_vulkan/vk_renderpass_cache.h"
|
||||
|
|
||||
|
namespace Vulkan { |
||||
|
|
||||
|
VKRenderPassCache::VKRenderPassCache(const VKDevice& device) : device{device} {} |
||||
|
|
||||
|
VKRenderPassCache::~VKRenderPassCache() = default; |
||||
|
|
||||
|
vk::RenderPass VKRenderPassCache::GetRenderPass(const RenderPassParams& params) { |
||||
|
const auto [pair, is_cache_miss] = cache.try_emplace(params); |
||||
|
auto& entry = pair->second; |
||||
|
if (is_cache_miss) { |
||||
|
entry = CreateRenderPass(params); |
||||
|
} |
||||
|
return *entry; |
||||
|
} |
||||
|
|
||||
|
UniqueRenderPass VKRenderPassCache::CreateRenderPass(const RenderPassParams& params) const { |
||||
|
std::vector<vk::AttachmentDescription> descriptors; |
||||
|
std::vector<vk::AttachmentReference> color_references; |
||||
|
|
||||
|
for (std::size_t rt = 0; rt < params.color_attachments.size(); ++rt) { |
||||
|
const auto attachment = params.color_attachments[rt]; |
||||
|
const auto format = |
||||
|
MaxwellToVK::SurfaceFormat(device, FormatType::Optimal, attachment.pixel_format); |
||||
|
ASSERT_MSG(format.attachable, "Trying to attach a non-attachable format with format={}", |
||||
|
static_cast<u32>(attachment.pixel_format)); |
||||
|
|
||||
|
// TODO(Rodrigo): Add eMayAlias when it's needed.
|
||||
|
const auto color_layout = attachment.is_texception |
||||
|
? vk::ImageLayout::eGeneral |
||||
|
: vk::ImageLayout::eColorAttachmentOptimal; |
||||
|
descriptors.emplace_back(vk::AttachmentDescriptionFlagBits::eMayAlias, format.format, |
||||
|
vk::SampleCountFlagBits::e1, vk::AttachmentLoadOp::eLoad, |
||||
|
vk::AttachmentStoreOp::eStore, vk::AttachmentLoadOp::eDontCare, |
||||
|
vk::AttachmentStoreOp::eDontCare, color_layout, color_layout); |
||||
|
color_references.emplace_back(static_cast<u32>(rt), color_layout); |
||||
|
} |
||||
|
|
||||
|
vk::AttachmentReference zeta_attachment_ref; |
||||
|
if (params.has_zeta) { |
||||
|
const auto format = |
||||
|
MaxwellToVK::SurfaceFormat(device, FormatType::Optimal, params.zeta_pixel_format); |
||||
|
ASSERT_MSG(format.attachable, "Trying to attach a non-attachable format with format={}", |
||||
|
static_cast<u32>(params.zeta_pixel_format)); |
||||
|
|
||||
|
const auto zeta_layout = params.zeta_texception |
||||
|
? vk::ImageLayout::eGeneral |
||||
|
: vk::ImageLayout::eDepthStencilAttachmentOptimal; |
||||
|
descriptors.emplace_back(vk::AttachmentDescriptionFlags{}, format.format, |
||||
|
vk::SampleCountFlagBits::e1, vk::AttachmentLoadOp::eLoad, |
||||
|
vk::AttachmentStoreOp::eStore, vk::AttachmentLoadOp::eLoad, |
||||
|
vk::AttachmentStoreOp::eStore, zeta_layout, zeta_layout); |
||||
|
zeta_attachment_ref = |
||||
|
vk::AttachmentReference(static_cast<u32>(params.color_attachments.size()), zeta_layout); |
||||
|
} |
||||
|
|
||||
|
const vk::SubpassDescription subpass_description( |
||||
|
{}, vk::PipelineBindPoint::eGraphics, 0, nullptr, static_cast<u32>(color_references.size()), |
||||
|
color_references.data(), nullptr, params.has_zeta ? &zeta_attachment_ref : nullptr, 0, |
||||
|
nullptr); |
||||
|
|
||||
|
vk::AccessFlags access; |
||||
|
vk::PipelineStageFlags stage; |
||||
|
if (!color_references.empty()) { |
||||
|
access |= |
||||
|
vk::AccessFlagBits::eColorAttachmentRead | vk::AccessFlagBits::eColorAttachmentWrite; |
||||
|
stage |= vk::PipelineStageFlagBits::eColorAttachmentOutput; |
||||
|
} |
||||
|
|
||||
|
if (params.has_zeta) { |
||||
|
access |= vk::AccessFlagBits::eDepthStencilAttachmentRead | |
||||
|
vk::AccessFlagBits::eDepthStencilAttachmentWrite; |
||||
|
stage |= vk::PipelineStageFlagBits::eLateFragmentTests; |
||||
|
} |
||||
|
|
||||
|
const vk::SubpassDependency subpass_dependency(VK_SUBPASS_EXTERNAL, 0, stage, stage, {}, access, |
||||
|
{}); |
||||
|
|
||||
|
const vk::RenderPassCreateInfo create_info({}, static_cast<u32>(descriptors.size()), |
||||
|
descriptors.data(), 1, &subpass_description, 1, |
||||
|
&subpass_dependency); |
||||
|
|
||||
|
const auto dev = device.GetLogical(); |
||||
|
const auto& dld = device.GetDispatchLoader(); |
||||
|
return dev.createRenderPassUnique(create_info, nullptr, dld); |
||||
|
} |
||||
|
|
||||
|
} // namespace Vulkan
|
||||
@ -0,0 +1,97 @@ |
|||||
|
// Copyright 2019 yuzu Emulator Project |
||||
|
// Licensed under GPLv2 or any later version |
||||
|
// Refer to the license.txt file included. |
||||
|
|
||||
|
#pragma once |
||||
|
|
||||
|
#include <memory> |
||||
|
#include <tuple> |
||||
|
#include <unordered_map> |
||||
|
|
||||
|
#include <boost/container/static_vector.hpp> |
||||
|
#include <boost/functional/hash.hpp> |
||||
|
|
||||
|
#include "video_core/engines/maxwell_3d.h" |
||||
|
#include "video_core/renderer_vulkan/declarations.h" |
||||
|
#include "video_core/surface.h" |
||||
|
|
||||
|
namespace Vulkan { |
||||
|
|
||||
|
class VKDevice; |
||||
|
|
||||
|
// TODO(Rodrigo): Optimize this structure for faster hashing |
||||
|
|
||||
|
struct RenderPassParams { |
||||
|
struct ColorAttachment { |
||||
|
u32 index = 0; |
||||
|
VideoCore::Surface::PixelFormat pixel_format = VideoCore::Surface::PixelFormat::Invalid; |
||||
|
bool is_texception = false; |
||||
|
|
||||
|
std::size_t Hash() const noexcept { |
||||
|
return static_cast<std::size_t>(pixel_format) | |
||||
|
static_cast<std::size_t>(is_texception) << 6 | |
||||
|
static_cast<std::size_t>(index) << 7; |
||||
|
} |
||||
|
|
||||
|
bool operator==(const ColorAttachment& rhs) const noexcept { |
||||
|
return std::tie(index, pixel_format, is_texception) == |
||||
|
std::tie(rhs.index, rhs.pixel_format, rhs.is_texception); |
||||
|
} |
||||
|
}; |
||||
|
|
||||
|
boost::container::static_vector<ColorAttachment, |
||||
|
Tegra::Engines::Maxwell3D::Regs::NumRenderTargets> |
||||
|
color_attachments{}; |
||||
|
// TODO(Rodrigo): Unify has_zeta into zeta_pixel_format and zeta_component_type. |
||||
|
VideoCore::Surface::PixelFormat zeta_pixel_format = VideoCore::Surface::PixelFormat::Invalid; |
||||
|
bool has_zeta = false; |
||||
|
bool zeta_texception = false; |
||||
|
|
||||
|
std::size_t Hash() const noexcept { |
||||
|
std::size_t hash = 0; |
||||
|
for (const auto& rt : color_attachments) { |
||||
|
boost::hash_combine(hash, rt.Hash()); |
||||
|
} |
||||
|
boost::hash_combine(hash, zeta_pixel_format); |
||||
|
boost::hash_combine(hash, has_zeta); |
||||
|
boost::hash_combine(hash, zeta_texception); |
||||
|
return hash; |
||||
|
} |
||||
|
|
||||
|
bool operator==(const RenderPassParams& rhs) const { |
||||
|
return std::tie(color_attachments, zeta_pixel_format, has_zeta, zeta_texception) == |
||||
|
std::tie(rhs.color_attachments, rhs.zeta_pixel_format, rhs.has_zeta, |
||||
|
rhs.zeta_texception); |
||||
|
} |
||||
|
}; |
||||
|
|
||||
|
} // namespace Vulkan |
||||
|
|
||||
|
namespace std { |
||||
|
|
||||
|
template <> |
||||
|
struct hash<Vulkan::RenderPassParams> { |
||||
|
std::size_t operator()(const Vulkan::RenderPassParams& k) const noexcept { |
||||
|
return k.Hash(); |
||||
|
} |
||||
|
}; |
||||
|
|
||||
|
} // namespace std |
||||
|
|
||||
|
namespace Vulkan { |
||||
|
|
||||
|
class VKRenderPassCache final { |
||||
|
public: |
||||
|
explicit VKRenderPassCache(const VKDevice& device); |
||||
|
~VKRenderPassCache(); |
||||
|
|
||||
|
vk::RenderPass GetRenderPass(const RenderPassParams& params); |
||||
|
|
||||
|
private: |
||||
|
UniqueRenderPass CreateRenderPass(const RenderPassParams& params) const; |
||||
|
|
||||
|
const VKDevice& device; |
||||
|
std::unordered_map<RenderPassParams, UniqueRenderPass> cache; |
||||
|
}; |
||||
|
|
||||
|
} // namespace Vulkan |
||||
Write
Preview
Loading…
Cancel
Save
Reference in new issue