From 03ccd8bf432e8b2c945b68f00e8fa88f67388098 Mon Sep 17 00:00:00 2001
From: Fernando Sahmkow
Date: Wed, 28 Dec 2022 09:32:31 -0500
Subject: Texture Cache: Implement async texture downloads.
---
src/video_core/texture_cache/texture_cache.h | 104 +++++++++++++++-------
src/video_core/texture_cache/texture_cache_base.h | 6 +-
2 files changed, 78 insertions(+), 32 deletions(-)
(limited to 'src/video_core/texture_cache')
diff --git a/src/video_core/texture_cache/texture_cache.h b/src/video_core/texture_cache/texture_cache.h
index 7fe451b5a..87152c8e9 100644
--- a/src/video_core/texture_cache/texture_cache.h
+++ b/src/video_core/texture_cache/texture_cache.h
@@ -646,7 +646,28 @@ bool TextureCache
::ShouldWaitAsyncFlushes() const noexcept {
template
void TextureCache::CommitAsyncFlushes() {
- // This is intentionally passing the value by copy
- committed_downloads.push(uncommitted_downloads);
+ // Hands the pending download list over to committed_downloads (moved, then cleared for reuse).
+ if constexpr (IMPLEMENTS_ASYNC_DOWNLOADS) {
+ const std::span download_ids = uncommitted_downloads;
+ if (download_ids.empty()) {
+ committed_downloads.emplace_back(std::move(uncommitted_downloads));
+ uncommitted_downloads.clear();
+ async_buffers.emplace_back(std::optional{}); // empty entry keeps async_buffers paired 1:1 with committed_downloads
+ return;
+ }
+ size_t total_size_bytes = 0;
+ for (const ImageId image_id : download_ids) {
+ total_size_bytes += Common::AlignUp(slot_images[image_id].unswizzled_size_bytes, 64); // size every slot with the same aligned stride the offsets below use
+ }
+ auto download_map = runtime.DownloadStagingBuffer(total_size_bytes, true);
+ for (const ImageId image_id : download_ids) {
+ Image& image = slot_images[image_id];
+ const auto copies = FullDownloadCopies(image.info);
+ image.DownloadMemory(download_map, copies);
+ download_map.offset += Common::AlignUp(image.unswizzled_size_bytes, 64); // next image starts on a 64-byte boundary
+ }
+ async_buffers.emplace_back(download_map); // stored with offset left at the end of the last slot
+ }
+ committed_downloads.emplace_back(std::move(uncommitted_downloads));
uncommitted_downloads.clear();
}
@@ -655,37 +676,58 @@ void TextureCache::PopAsyncFlushes() {
if (committed_downloads.empty()) {
return;
}
- const std::span download_ids = committed_downloads.front();
- if (download_ids.empty()) {
- committed_downloads.pop();
- return;
- }
- size_t total_size_bytes = 0;
- for (const ImageId image_id : download_ids) {
- total_size_bytes += slot_images[image_id].unswizzled_size_bytes;
- }
- auto download_map = runtime.DownloadStagingBuffer(total_size_bytes);
- const size_t original_offset = download_map.offset;
- for (const ImageId image_id : download_ids) {
- Image& image = slot_images[image_id];
- const auto copies = FullDownloadCopies(image.info);
- image.DownloadMemory(download_map, copies);
- download_map.offset += image.unswizzled_size_bytes;
- }
- // Wait for downloads to finish
- runtime.Finish();
-
- download_map.offset = original_offset;
- std::span download_span = download_map.mapped_span;
- for (const ImageId image_id : download_ids) {
- const ImageBase& image = slot_images[image_id];
- const auto copies = FullDownloadCopies(image.info);
- SwizzleImage(*gpu_memory, image.gpu_addr, image.info, copies, download_span,
- swizzle_data_buffer);
- download_map.offset += image.unswizzled_size_bytes;
- download_span = download_span.subspan(image.unswizzled_size_bytes);
+ if constexpr (IMPLEMENTS_ASYNC_DOWNLOADS) { // async path: consumes the entry at the front of async_buffers
+ const std::span download_ids = committed_downloads.front();
+ if (download_ids.empty()) {
+ committed_downloads.pop_front();
+ async_buffers.pop_front(); // drop the entry paired with the empty download list
+ return;
+ }
+ auto download_map = *async_buffers.front(); // local copy; assumes the optional is engaged whenever the id list is non-empty
+ std::span download_span = download_map.mapped_span;
+ for (size_t i = download_ids.size(); i > 0; i--) { // walk the images last-to-first
+ const ImageBase& image = slot_images[download_ids[i - 1]];
+ const auto copies = FullDownloadCopies(image.info);
+ download_map.offset -= Common::AlignUp(image.unswizzled_size_bytes, 64); // step back one 64-byte-aligned slot to this image's start
+ std::span download_span_alt = download_span.subspan(download_map.offset); // view beginning at this image's slot
+ SwizzleImage(*gpu_memory, image.gpu_addr, image.info, copies, download_span_alt,
+ swizzle_data_buffer);
+ }
+ runtime.FreeDeferredStagingBuffer(download_map); // NOTE(review): presumably hands the buffer back to the runtime - confirm
+ committed_downloads.pop_front();
+ async_buffers.pop_front();
+ } else { // non-async path: same statements as the removed code above, with pop() replaced by pop_front()
+ const std::span download_ids = committed_downloads.front();
+ if (download_ids.empty()) {
+ committed_downloads.pop_front();
+ return;
+ }
+ size_t total_size_bytes = 0;
+ for (const ImageId image_id : download_ids) {
+ total_size_bytes += slot_images[image_id].unswizzled_size_bytes;
+ }
+ auto download_map = runtime.DownloadStagingBuffer(total_size_bytes);
+ const size_t original_offset = download_map.offset; // remembered so the offset can be rewound after the download loop
+ for (const ImageId image_id : download_ids) {
+ Image& image = slot_images[image_id];
+ const auto copies = FullDownloadCopies(image.info);
+ image.DownloadMemory(download_map, copies);
+ download_map.offset += image.unswizzled_size_bytes; // slots are packed back-to-back, no alignment padding here
+ }
+ // Wait for downloads to finish
+ runtime.Finish();
+ download_map.offset = original_offset; // rewind before the second pass over the same images
+ std::span download_span = download_map.mapped_span;
+ for (const ImageId image_id : download_ids) {
+ const ImageBase& image = slot_images[image_id];
+ const auto copies = FullDownloadCopies(image.info);
+ SwizzleImage(*gpu_memory, image.gpu_addr, image.info, copies, download_span,
+ swizzle_data_buffer);
+ download_map.offset += image.unswizzled_size_bytes;
+ download_span = download_span.subspan(image.unswizzled_size_bytes); // advance the view past this image's bytes
+ }
+ committed_downloads.pop_front();
}
- committed_downloads.pop();
}
template
diff --git a/src/video_core/texture_cache/texture_cache_base.h b/src/video_core/texture_cache/texture_cache_base.h
index 6b2898705..4eea1f609 100644
--- a/src/video_core/texture_cache/texture_cache_base.h
+++ b/src/video_core/texture_cache/texture_cache_base.h
@@ -92,6 +92,8 @@ class TextureCache : public VideoCommon::ChannelSetupCaches::max()};
@@ -106,6 +108,7 @@ class TextureCache : public VideoCommon::ChannelSetupCaches uncommitted_downloads;
- std::queue> committed_downloads;
+ std::deque> committed_downloads;
+ std::deque> async_buffers;
struct LRUItemParams {
using ObjectType = ImageId;
--
cgit v1.2.3