diff options
| author | 2023-05-27 22:04:16 -0400 | |
|---|---|---|
| committer | 2023-05-28 00:38:47 -0400 | |
| commit | cb0a41090705f974d5bec009c571344bf72aa375 (patch) | |
| tree | f96606db55cddbdeb8d48853b0b7aa85c4a4dab6 | |
| parent | OpenGL: Make use of persistent buffer maps in buffer cache downloads (diff) | |
| download | yuzu-cb0a41090705f974d5bec009c571344bf72aa375.tar.gz yuzu-cb0a41090705f974d5bec009c571344bf72aa375.tar.xz yuzu-cb0a41090705f974d5bec009c571344bf72aa375.zip | |
gl_staging_buffers: Optimization to reduce fence waiting
| -rw-r--r-- | src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp | 24 | ||||
| -rw-r--r-- | src/video_core/renderer_opengl/gl_staging_buffer_pool.h | 2 |
2 files changed, 22 insertions, 4 deletions
diff --git a/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp b/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp index 72b1dbb32..bbb06e51f 100644 --- a/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp +++ b/src/video_core/renderer_opengl/gl_staging_buffer_pool.cpp | |||
| @@ -9,8 +9,12 @@ | |||
| 9 | 9 | ||
| 10 | #include "common/alignment.h" | 10 | #include "common/alignment.h" |
| 11 | #include "common/assert.h" | 11 | #include "common/assert.h" |
| 12 | #include "common/bit_util.h" | ||
| 13 | #include "common/microprofile.h" | ||
| 12 | #include "video_core/renderer_opengl/gl_staging_buffer_pool.h" | 14 | #include "video_core/renderer_opengl/gl_staging_buffer_pool.h" |
| 13 | 15 | ||
| 16 | MICROPROFILE_DEFINE(OpenGL_BufferRequest, "OpenGL", "BufferRequest", MP_RGB(128, 128, 192)); | ||
| 17 | |||
| 14 | namespace OpenGL { | 18 | namespace OpenGL { |
| 15 | 19 | ||
| 16 | StagingBufferMap::~StagingBufferMap() { | 20 | StagingBufferMap::~StagingBufferMap() { |
| @@ -25,8 +29,11 @@ StagingBuffers::StagingBuffers(GLenum storage_flags_, GLenum map_flags_) | |||
| 25 | StagingBuffers::~StagingBuffers() = default; | 29 | StagingBuffers::~StagingBuffers() = default; |
| 26 | 30 | ||
| 27 | StagingBufferMap StagingBuffers::RequestMap(size_t requested_size, bool insert_fence) { | 31 | StagingBufferMap StagingBuffers::RequestMap(size_t requested_size, bool insert_fence) { |
| 32 | MICROPROFILE_SCOPE(OpenGL_BufferRequest); | ||
| 33 | |||
| 28 | const size_t index = RequestBuffer(requested_size); | 34 | const size_t index = RequestBuffer(requested_size); |
| 29 | OGLSync* const sync = insert_fence ? &syncs[index] : nullptr; | 35 | OGLSync* const sync = insert_fence ? &syncs[index] : nullptr; |
| 36 | sync_indices[index] = insert_fence ? ++current_sync_index : 0; | ||
| 30 | return StagingBufferMap{ | 37 | return StagingBufferMap{ |
| 31 | .mapped_span = std::span(maps[index], requested_size), | 38 | .mapped_span = std::span(maps[index], requested_size), |
| 32 | .sync = sync, | 39 | .sync = sync, |
| @@ -41,13 +48,14 @@ size_t StagingBuffers::RequestBuffer(size_t requested_size) { | |||
| 41 | 48 | ||
| 42 | OGLBuffer& buffer = buffers.emplace_back(); | 49 | OGLBuffer& buffer = buffers.emplace_back(); |
| 43 | buffer.Create(); | 50 | buffer.Create(); |
| 44 | glNamedBufferStorage(buffer.handle, requested_size, nullptr, | 51 | const auto next_pow2_size = Common::NextPow2(requested_size); |
| 52 | glNamedBufferStorage(buffer.handle, next_pow2_size, nullptr, | ||
| 45 | storage_flags | GL_MAP_PERSISTENT_BIT); | 53 | storage_flags | GL_MAP_PERSISTENT_BIT); |
| 46 | maps.push_back(static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, requested_size, | 54 | maps.push_back(static_cast<u8*>(glMapNamedBufferRange(buffer.handle, 0, next_pow2_size, |
| 47 | map_flags | GL_MAP_PERSISTENT_BIT))); | 55 | map_flags | GL_MAP_PERSISTENT_BIT))); |
| 48 | |||
| 49 | syncs.emplace_back(); | 56 | syncs.emplace_back(); |
| 50 | sizes.push_back(requested_size); | 57 | sync_indices.emplace_back(); |
| 58 | sizes.push_back(next_pow2_size); | ||
| 51 | 59 | ||
| 52 | ASSERT(syncs.size() == buffers.size() && buffers.size() == maps.size() && | 60 | ASSERT(syncs.size() == buffers.size() && buffers.size() == maps.size() && |
| 53 | maps.size() == sizes.size()); | 61 | maps.size() == sizes.size()); |
| @@ -56,6 +64,7 @@ size_t StagingBuffers::RequestBuffer(size_t requested_size) { | |||
| 56 | } | 64 | } |
| 57 | 65 | ||
| 58 | std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) { | 66 | std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) { |
| 67 | size_t known_unsignaled_index = current_sync_index + 1; | ||
| 59 | size_t smallest_buffer = std::numeric_limits<size_t>::max(); | 68 | size_t smallest_buffer = std::numeric_limits<size_t>::max(); |
| 60 | std::optional<size_t> found; | 69 | std::optional<size_t> found; |
| 61 | const size_t num_buffers = sizes.size(); | 70 | const size_t num_buffers = sizes.size(); |
| @@ -65,7 +74,14 @@ std::optional<size_t> StagingBuffers::FindBuffer(size_t requested_size) { | |||
| 65 | continue; | 74 | continue; |
| 66 | } | 75 | } |
| 67 | if (syncs[index].handle != 0) { | 76 | if (syncs[index].handle != 0) { |
| 77 | if (sync_indices[index] >= known_unsignaled_index) { | ||
| 78 | // This fence is later than a fence that is known to not be signaled | ||
| 79 | continue; | ||
| 80 | } | ||
| 68 | if (!syncs[index].IsSignaled()) { | 81 | if (!syncs[index].IsSignaled()) { |
| 82 | // Since this fence hasn't been signaled, it's safe to assume all later | ||
| 83 | // fences haven't been signaled either | ||
| 84 | known_unsignaled_index = std::min(known_unsignaled_index, sync_indices[index]); | ||
| 69 | continue; | 85 | continue; |
| 70 | } | 86 | } |
| 71 | syncs[index].Release(); | 87 | syncs[index].Release(); |
diff --git a/src/video_core/renderer_opengl/gl_staging_buffer_pool.h b/src/video_core/renderer_opengl/gl_staging_buffer_pool.h index 2c467be3d..60f72d3a0 100644 --- a/src/video_core/renderer_opengl/gl_staging_buffer_pool.h +++ b/src/video_core/renderer_opengl/gl_staging_buffer_pool.h | |||
| @@ -42,8 +42,10 @@ struct StagingBuffers { | |||
| 42 | std::vector<OGLBuffer> buffers; | 42 | std::vector<OGLBuffer> buffers; |
| 43 | std::vector<u8*> maps; | 43 | std::vector<u8*> maps; |
| 44 | std::vector<size_t> sizes; | 44 | std::vector<size_t> sizes; |
| 45 | std::vector<size_t> sync_indices; | ||
| 45 | GLenum storage_flags; | 46 | GLenum storage_flags; |
| 46 | GLenum map_flags; | 47 | GLenum map_flags; |
| 48 | size_t current_sync_index = 0; | ||
| 47 | }; | 49 | }; |
| 48 | 50 | ||
| 49 | class StreamBuffer { | 51 | class StreamBuffer { |