summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorGravatar ameerj2023-05-27 22:04:16 -0400
committerGravatar ameerj2023-05-28 00:38:47 -0400
commitcb0a41090705f974d5bec009c571344bf72aa375 (patch)
treef96606db55cddbdeb8d48853b0b7aa85c4a4dab6
parentOpenGL: Make use of persistent buffer maps in buffer cache downloads (diff)
downloadyuzu-cb0a41090705f974d5bec009c571344bf72aa375.tar.gz
yuzu-cb0a41090705f974d5bec009c571344bf72aa375.tar.xz
yuzu-cb0a41090705f974d5bec009c571344bf72aa375.zip
gl_staging_buffers: Optimization to reduce fence waiting
-rw-r--r--src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp24
-rw-r--r--src/video_core/renderer_opengl/gl_staging_buffer_pool.h2
2 files changed, 22 insertions, 4 deletions
diff --git a/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp b/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp
index 72b1dbb32..bbb06e51f 100644
--- a/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp
+++ b/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp
@@ -9,8 +9,12 @@
9 9
10#include "common/alignment.h" 10#include "common/alignment.h"
11#include "common/assert.h" 11#include "common/assert.h"
12#include "common/bit_util.h"
13#include "common/microprofile.h"
12#include "video_core/renderer_opengl/gl_staging_buffer_pool.h" 14#include "video_core/renderer_opengl/gl_staging_buffer_pool.h"
13 15
16MICROPROFILE_DEFINE(OpenGL_BufferRequest, "OpenGL", "BufferRequest", MP_RGB(128, 128, 192));
17
14namespace OpenGL { 18namespace OpenGL {
15 19
16StagingBufferMap::~StagingBufferMap() { 20StagingBufferMap::~StagingBufferMap() {
@@ -25,8 +29,11 @@ StagingBuffers::StagingBuffers(GLenum storage_flags_, GLenum map_flags_)
25StagingBuffers::~StagingBuffers() = default; 29StagingBuffers::~StagingBuffers() = default;
26 30
27StagingBufferMap StagingBuffers::RequestMap(size_t requested_size, bool insert_fence) { 31StagingBufferMap StagingBuffers::RequestMap(size_t requested_size, bool insert_fence) {
32 MICROPROFILE_SCOPE(OpenGL_BufferRequest);
33
28 const size_t index = RequestBuffer(requested_size); 34 const size_t index = RequestBuffer(requested_size);
29 OGLSync* const sync = insert_fence ? &syncs[index] : nullptr; 35 OGLSync* const sync = insert_fence ? &syncs[index] : nullptr;
36 sync_indices[index] = insert_fence ? ++current_sync_index : 0;
30 return StagingBufferMap{ 37 return StagingBufferMap{
31 .mapped_span = std::span(maps[index], requested_size), 38 .mapped_span = std::span(maps[index], requested_size),
32 .sync = sync, 39 .sync = sync,
@@ -41,13 +48,14 @@ size_t StagingBuffers::RequestBuffer(size_t requested_size) {
41 48
42 OGLBuffer& buffer = buffers.emplace_back(); 49 OGLBuffer& buffer = buffers.emplace_back();
43 buffer.Create(); 50 buffer.Create();
44 glNamedBufferStorage(buffer.handle, requested_size, nullptr, 51 const auto next_pow2_size = Common::NextPow2(requested_size);
52 glNamedBufferStorage(buffer.handle, next_pow2_size, nullptr,
45 storage_flags | GL_MAP_PERSISTENT_BIT); 53 storage_flags | GL_MAP_PERSISTENT_BIT);
46 maps.push_back(static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, requested_size, 54 maps.push_back(static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, next_pow2_size,
47 map_flags | GL_MAP_PERSISTENT_BIT))); 55 map_flags | GL_MAP_PERSISTENT_BIT)));
48
49 syncs.emplace_back(); 56 syncs.emplace_back();
50 sizes.push_back(requested_size); 57 sync_indices.emplace_back();
58 sizes.push_back(next_pow2_size);
51 59
52 ASSERT(syncs.size() == buffers.size() && buffers.size() == maps.size() && 60 ASSERT(syncs.size() == buffers.size() && buffers.size() == maps.size() &&
53 maps.size() == sizes.size()); 61 maps.size() == sizes.size());
@@ -56,6 +64,7 @@ size_t StagingBuffers::RequestBuffer(size_t requested_size) {
56} 64}
57 65
58std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) { 66std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) {
67 size_t known_unsignaled_index = current_sync_index + 1;
59 size_t smallest_buffer = std::numeric_limits<size_t>::max(); 68 size_t smallest_buffer = std::numeric_limits<size_t>::max();
60 std::optional<size_t> found; 69 std::optional<size_t> found;
61 const size_t num_buffers = sizes.size(); 70 const size_t num_buffers = sizes.size();
@@ -65,7 +74,14 @@ std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) {
65 continue; 74 continue;
66 } 75 }
67 if (syncs[index].handle != 0) { 76 if (syncs[index].handle != 0) {
77 if (sync_indices[index] >= known_unsignaled_index) {
78 // This fence is later than a fence that is known to not be signaled
79 continue;
80 }
68 if (!syncs[index].IsSignaled()) { 81 if (!syncs[index].IsSignaled()) {
82 // Since this fence hasn't been signaled, it's safe to assume all later
83 // fences haven't been signaled either
84 known_unsignaled_index = std::min(known_unsignaled_index, sync_indices[index]);
69 continue; 85 continue;
70 } 86 }
71 syncs[index].Release(); 87 syncs[index].Release();
diff --git a/src/video_core/renderer_opengl/gl_staging_buffer_pool.h b/src/video_core/renderer_opengl/gl_staging_buffer_pool.h
index 2c467be3d..60f72d3a0 100644
--- a/src/video_core/renderer_opengl/gl_staging_buffer_pool.h
+++ b/src/video_core/renderer_opengl/gl_staging_buffer_pool.h
@@ -42,8 +42,10 @@ struct StagingBuffers {
42 std::vector<OGLBuffer> buffers; 42 std::vector<OGLBuffer> buffers;
43 std::vector<u8*> maps; 43 std::vector<u8*> maps;
44 std::vector<size_t> sizes; 44 std::vector<size_t> sizes;
45 std::vector<size_t> sync_indices;
45 GLenum storage_flags; 46 GLenum storage_flags;
46 GLenum map_flags; 47 GLenum map_flags;
48 size_t current_sync_index = 0;
47}; 49};
48 50
49class StreamBuffer { 51class StreamBuffer {