Browse Source
Merge pull request #10476 from ameerj/gl-memory-maps
Merge pull request #10476 from ameerj/gl-memory-maps
OpenGL: Make use of persistent buffer maps in buffer cachepull/15/merge
committed by
GitHub
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
15 changed files with 316 additions and 204 deletions
-
4src/video_core/CMakeLists.txt
-
10src/video_core/buffer_cache/buffer_cache.h
-
1src/video_core/buffer_cache/buffer_cache_base.h
-
58src/video_core/renderer_opengl/gl_buffer_cache.cpp
-
29src/video_core/renderer_opengl/gl_buffer_cache.h
-
6src/video_core/renderer_opengl/gl_rasterizer.cpp
-
1src/video_core/renderer_opengl/gl_rasterizer.h
-
150src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp
-
44src/video_core/renderer_opengl/gl_staging_buffer_pool.h
-
63src/video_core/renderer_opengl/gl_stream_buffer.cpp
-
87src/video_core/renderer_opengl/gl_texture_cache.cpp
-
47src/video_core/renderer_opengl/gl_texture_cache.h
-
9src/video_core/renderer_opengl/util_shaders.cpp
-
10src/video_core/renderer_opengl/util_shaders.h
-
1src/video_core/renderer_vulkan/vk_buffer_cache.h
@ -0,0 +1,150 @@ |
|||
// SPDX-FileCopyrightText: Copyright 2021 yuzu Emulator Project
|
|||
// SPDX-License-Identifier: GPL-2.0-or-later
|
|||
|
|||
#include <array>
|
|||
#include <memory>
|
|||
#include <span>
|
|||
|
|||
#include <glad/glad.h>
|
|||
|
|||
#include "common/alignment.h"
|
|||
#include "common/assert.h"
|
|||
#include "common/bit_util.h"
|
|||
#include "common/microprofile.h"
|
|||
#include "video_core/renderer_opengl/gl_staging_buffer_pool.h"
|
|||
|
|||
MICROPROFILE_DEFINE(OpenGL_BufferRequest, "OpenGL", "BufferRequest", MP_RGB(128, 128, 192)); |
|||
|
|||
namespace OpenGL { |
|||
|
|||
StagingBufferMap::~StagingBufferMap() { |
|||
if (sync) { |
|||
sync->Create(); |
|||
} |
|||
} |
|||
|
|||
StagingBuffers::StagingBuffers(GLenum storage_flags_, GLenum map_flags_) |
|||
: storage_flags{storage_flags_}, map_flags{map_flags_} {} |
|||
|
|||
StagingBuffers::~StagingBuffers() = default; |
|||
|
|||
StagingBufferMap StagingBuffers::RequestMap(size_t requested_size, bool insert_fence) { |
|||
MICROPROFILE_SCOPE(OpenGL_BufferRequest); |
|||
|
|||
const size_t index = RequestBuffer(requested_size); |
|||
OGLSync* const sync = insert_fence ? &syncs[index] : nullptr; |
|||
sync_indices[index] = insert_fence ? ++current_sync_index : 0; |
|||
return StagingBufferMap{ |
|||
.mapped_span = std::span(maps[index], requested_size), |
|||
.sync = sync, |
|||
.buffer = buffers[index].handle, |
|||
}; |
|||
} |
|||
|
|||
size_t StagingBuffers::RequestBuffer(size_t requested_size) { |
|||
if (const std::optional<size_t> index = FindBuffer(requested_size); index) { |
|||
return *index; |
|||
} |
|||
|
|||
OGLBuffer& buffer = buffers.emplace_back(); |
|||
buffer.Create(); |
|||
const auto next_pow2_size = Common::NextPow2(requested_size); |
|||
glNamedBufferStorage(buffer.handle, next_pow2_size, nullptr, |
|||
storage_flags | GL_MAP_PERSISTENT_BIT); |
|||
maps.push_back(static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, next_pow2_size, |
|||
map_flags | GL_MAP_PERSISTENT_BIT))); |
|||
syncs.emplace_back(); |
|||
sync_indices.emplace_back(); |
|||
sizes.push_back(next_pow2_size); |
|||
|
|||
ASSERT(syncs.size() == buffers.size() && buffers.size() == maps.size() && |
|||
maps.size() == sizes.size()); |
|||
|
|||
return buffers.size() - 1; |
|||
} |
|||
|
|||
std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) { |
|||
size_t known_unsignaled_index = current_sync_index + 1; |
|||
size_t smallest_buffer = std::numeric_limits<size_t>::max(); |
|||
std::optional<size_t> found; |
|||
const size_t num_buffers = sizes.size(); |
|||
for (size_t index = 0; index < num_buffers; ++index) { |
|||
const size_t buffer_size = sizes[index]; |
|||
if (buffer_size < requested_size || buffer_size >= smallest_buffer) { |
|||
continue; |
|||
} |
|||
if (syncs[index].handle != 0) { |
|||
if (sync_indices[index] >= known_unsignaled_index) { |
|||
// This fence is later than a fence that is known to not be signaled
|
|||
continue; |
|||
} |
|||
if (!syncs[index].IsSignaled()) { |
|||
// Since this fence hasn't been signaled, it's safe to assume all later
|
|||
// fences haven't been signaled either
|
|||
known_unsignaled_index = std::min(known_unsignaled_index, sync_indices[index]); |
|||
continue; |
|||
} |
|||
syncs[index].Release(); |
|||
} |
|||
smallest_buffer = buffer_size; |
|||
found = index; |
|||
} |
|||
return found; |
|||
} |
|||
|
|||
StreamBuffer::StreamBuffer() { |
|||
static constexpr GLenum flags = GL_MAP_WRITE_BIT | GL_MAP_PERSISTENT_BIT | GL_MAP_COHERENT_BIT; |
|||
buffer.Create(); |
|||
glObjectLabel(GL_BUFFER, buffer.handle, -1, "Stream Buffer"); |
|||
glNamedBufferStorage(buffer.handle, STREAM_BUFFER_SIZE, nullptr, flags); |
|||
mapped_pointer = |
|||
static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, STREAM_BUFFER_SIZE, flags)); |
|||
for (OGLSync& sync : fences) { |
|||
sync.Create(); |
|||
} |
|||
} |
|||
|
|||
std::pair<std::span<u8>, size_t> StreamBuffer::Request(size_t size) noexcept { |
|||
ASSERT(size < REGION_SIZE); |
|||
for (size_t region = Region(used_iterator), region_end = Region(iterator); region < region_end; |
|||
++region) { |
|||
fences[region].Create(); |
|||
} |
|||
used_iterator = iterator; |
|||
|
|||
for (size_t region = Region(free_iterator) + 1, |
|||
region_end = std::min(Region(iterator + size) + 1, NUM_SYNCS); |
|||
region < region_end; ++region) { |
|||
glClientWaitSync(fences[region].handle, 0, GL_TIMEOUT_IGNORED); |
|||
fences[region].Release(); |
|||
} |
|||
if (iterator + size >= free_iterator) { |
|||
free_iterator = iterator + size; |
|||
} |
|||
if (iterator + size > STREAM_BUFFER_SIZE) { |
|||
for (size_t region = Region(used_iterator); region < NUM_SYNCS; ++region) { |
|||
fences[region].Create(); |
|||
} |
|||
used_iterator = 0; |
|||
iterator = 0; |
|||
free_iterator = size; |
|||
|
|||
for (size_t region = 0, region_end = Region(size); region <= region_end; ++region) { |
|||
glClientWaitSync(fences[region].handle, 0, GL_TIMEOUT_IGNORED); |
|||
fences[region].Release(); |
|||
} |
|||
} |
|||
const size_t offset = iterator; |
|||
iterator = Common::AlignUp(iterator + size, MAX_ALIGNMENT); |
|||
return {std::span(mapped_pointer + offset, size), offset}; |
|||
} |
|||
|
|||
StagingBufferMap StagingBufferPool::RequestUploadBuffer(size_t size) { |
|||
return upload_buffers.RequestMap(size, true); |
|||
} |
|||
|
|||
StagingBufferMap StagingBufferPool::RequestDownloadBuffer(size_t size) { |
|||
return download_buffers.RequestMap(size, false); |
|||
} |
|||
|
|||
} // namespace OpenGL
|
|||
@ -1,63 +0,0 @@ |
|||
// SPDX-FileCopyrightText: Copyright 2021 yuzu Emulator Project
|
|||
// SPDX-License-Identifier: GPL-2.0-or-later
|
|||
|
|||
#include <array>
|
|||
#include <memory>
|
|||
#include <span>
|
|||
|
|||
#include <glad/glad.h>
|
|||
|
|||
#include "common/alignment.h"
|
|||
#include "common/assert.h"
|
|||
#include "video_core/renderer_opengl/gl_stream_buffer.h"
|
|||
|
|||
namespace OpenGL { |
|||
|
|||
StreamBuffer::StreamBuffer() { |
|||
static constexpr GLenum flags = GL_MAP_WRITE_BIT | GL_MAP_PERSISTENT_BIT | GL_MAP_COHERENT_BIT; |
|||
buffer.Create(); |
|||
glObjectLabel(GL_BUFFER, buffer.handle, -1, "Stream Buffer"); |
|||
glNamedBufferStorage(buffer.handle, STREAM_BUFFER_SIZE, nullptr, flags); |
|||
mapped_pointer = |
|||
static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, STREAM_BUFFER_SIZE, flags)); |
|||
for (OGLSync& sync : fences) { |
|||
sync.Create(); |
|||
} |
|||
} |
|||
|
|||
std::pair<std::span<u8>, size_t> StreamBuffer::Request(size_t size) noexcept { |
|||
ASSERT(size < REGION_SIZE); |
|||
for (size_t region = Region(used_iterator), region_end = Region(iterator); region < region_end; |
|||
++region) { |
|||
fences[region].Create(); |
|||
} |
|||
used_iterator = iterator; |
|||
|
|||
for (size_t region = Region(free_iterator) + 1, |
|||
region_end = std::min(Region(iterator + size) + 1, NUM_SYNCS); |
|||
region < region_end; ++region) { |
|||
glClientWaitSync(fences[region].handle, 0, GL_TIMEOUT_IGNORED); |
|||
fences[region].Release(); |
|||
} |
|||
if (iterator + size >= free_iterator) { |
|||
free_iterator = iterator + size; |
|||
} |
|||
if (iterator + size > STREAM_BUFFER_SIZE) { |
|||
for (size_t region = Region(used_iterator); region < NUM_SYNCS; ++region) { |
|||
fences[region].Create(); |
|||
} |
|||
used_iterator = 0; |
|||
iterator = 0; |
|||
free_iterator = size; |
|||
|
|||
for (size_t region = 0, region_end = Region(size); region <= region_end; ++region) { |
|||
glClientWaitSync(fences[region].handle, 0, GL_TIMEOUT_IGNORED); |
|||
fences[region].Release(); |
|||
} |
|||
} |
|||
const size_t offset = iterator; |
|||
iterator = Common::AlignUp(iterator + size, MAX_ALIGNMENT); |
|||
return {std::span(mapped_pointer + offset, size), offset}; |
|||
} |
|||
|
|||
} // namespace OpenGL
|
|||
Write
Preview
Loading…
Cancel
Save
Reference in new issue