diff options
| author | 2020-12-30 22:06:05 -0800 | |
|---|---|---|
| committer | 2020-12-30 22:06:05 -0800 | |
| commit | 25d607f5f63929369fb74f386a920b69bb24f442 (patch) | |
| tree | 9ee5a023f033d99561a0358c5c71aeecc92c9d64 /src/video_core/gpu_thread.cpp | |
| parent | Merge pull request #5263 from lioncash/uninit (diff) | |
| parent | hle: kernel: service_thread: Make thread naming more consistent. (diff) | |
| download | yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.gz yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.xz yuzu-25d607f5f63929369fb74f386a920b69bb24f442.zip | |
Merge pull request #5208 from bunnei/service-threads
Service threads
Diffstat (limited to 'src/video_core/gpu_thread.cpp')
| -rw-r--r-- | src/video_core/gpu_thread.cpp | 36 |
1 files changed, 29 insertions, 7 deletions
diff --git a/src/video_core/gpu_thread.cpp b/src/video_core/gpu_thread.cpp index e27218b96..7e490bcc3 100644 --- a/src/video_core/gpu_thread.cpp +++ b/src/video_core/gpu_thread.cpp | |||
| @@ -4,6 +4,7 @@ | |||
| 4 | 4 | ||
| 5 | #include "common/assert.h" | 5 | #include "common/assert.h" |
| 6 | #include "common/microprofile.h" | 6 | #include "common/microprofile.h" |
| 7 | #include "common/scope_exit.h" | ||
| 7 | #include "common/thread.h" | 8 | #include "common/thread.h" |
| 8 | #include "core/core.h" | 9 | #include "core/core.h" |
| 9 | #include "core/frontend/emu_window.h" | 10 | #include "core/frontend/emu_window.h" |
| @@ -21,6 +22,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer, | |||
| 21 | SynchState& state, Tegra::CDmaPusher& cdma_pusher) { | 22 | SynchState& state, Tegra::CDmaPusher& cdma_pusher) { |
| 22 | std::string name = "yuzu:GPU"; | 23 | std::string name = "yuzu:GPU"; |
| 23 | MicroProfileOnThreadCreate(name.c_str()); | 24 | MicroProfileOnThreadCreate(name.c_str()); |
| 25 | SCOPE_EXIT({ MicroProfileOnThreadExit(); }); | ||
| 26 | |||
| 24 | Common::SetCurrentThreadName(name.c_str()); | 27 | Common::SetCurrentThreadName(name.c_str()); |
| 25 | Common::SetCurrentThreadPriority(Common::ThreadPriority::High); | 28 | Common::SetCurrentThreadPriority(Common::ThreadPriority::High); |
| 26 | system.RegisterHostThread(); | 29 | system.RegisterHostThread(); |
| @@ -65,7 +68,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer, | |||
| 65 | } | 68 | } |
| 66 | } | 69 | } |
| 67 | 70 | ||
| 68 | ThreadManager::ThreadManager(Core::System& system_) : system{system_} {} | 71 | ThreadManager::ThreadManager(Core::System& system_, bool is_async_) |
| 72 | : system{system_}, is_async{is_async_} {} | ||
| 69 | 73 | ||
| 70 | ThreadManager::~ThreadManager() { | 74 | ThreadManager::~ThreadManager() { |
| 71 | if (!thread.joinable()) { | 75 | if (!thread.joinable()) { |
| @@ -97,19 +101,30 @@ void ThreadManager::SwapBuffers(const Tegra::FramebufferConfig* framebuffer) { | |||
| 97 | } | 101 | } |
| 98 | 102 | ||
| 99 | void ThreadManager::FlushRegion(VAddr addr, u64 size) { | 103 | void ThreadManager::FlushRegion(VAddr addr, u64 size) { |
| 100 | if (!Settings::IsGPULevelHigh()) { | 104 | if (!is_async) { |
| 105 | // Always flush with synchronous GPU mode | ||
| 101 | PushCommand(FlushRegionCommand(addr, size)); | 106 | PushCommand(FlushRegionCommand(addr, size)); |
| 102 | return; | 107 | return; |
| 103 | } | 108 | } |
| 104 | if (!Settings::IsGPULevelExtreme()) { | 109 | |
| 105 | return; | 110 | // Asynchronous GPU mode |
| 106 | } | 111 | switch (Settings::values.gpu_accuracy.GetValue()) { |
| 107 | if (system.Renderer().Rasterizer().MustFlushRegion(addr, size)) { | 112 | case Settings::GPUAccuracy::Normal: |
| 113 | PushCommand(FlushRegionCommand(addr, size)); | ||
| 114 | break; | ||
| 115 | case Settings::GPUAccuracy::High: | ||
| 116 | // TODO(bunnei): Is this right? Preserving existing behavior for now | ||
| 117 | break; | ||
| 118 | case Settings::GPUAccuracy::Extreme: { | ||
| 108 | auto& gpu = system.GPU(); | 119 | auto& gpu = system.GPU(); |
| 109 | u64 fence = gpu.RequestFlush(addr, size); | 120 | u64 fence = gpu.RequestFlush(addr, size); |
| 110 | PushCommand(GPUTickCommand()); | 121 | PushCommand(GPUTickCommand()); |
| 111 | while (fence > gpu.CurrentFlushRequestFence()) { | 122 | while (fence > gpu.CurrentFlushRequestFence()) { |
| 112 | } | 123 | } |
| 124 | break; | ||
| 125 | } | ||
| 126 | default: | ||
| 127 | UNIMPLEMENTED_MSG("Unsupported gpu_accuracy {}", Settings::values.gpu_accuracy.GetValue()); | ||
| 113 | } | 128 | } |
| 114 | } | 129 | } |
| 115 | 130 | ||
| @@ -123,7 +138,8 @@ void ThreadManager::FlushAndInvalidateRegion(VAddr addr, u64 size) { | |||
| 123 | } | 138 | } |
| 124 | 139 | ||
| 125 | void ThreadManager::WaitIdle() const { | 140 | void ThreadManager::WaitIdle() const { |
| 126 | while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed)) { | 141 | while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed) && |
| 142 | system.IsPoweredOn()) { | ||
| 127 | } | 143 | } |
| 128 | } | 144 | } |
| 129 | 145 | ||
| @@ -134,6 +150,12 @@ void ThreadManager::OnCommandListEnd() { | |||
| 134 | u64 ThreadManager::PushCommand(CommandData&& command_data) { | 150 | u64 ThreadManager::PushCommand(CommandData&& command_data) { |
| 135 | const u64 fence{++state.last_fence}; | 151 | const u64 fence{++state.last_fence}; |
| 136 | state.queue.Push(CommandDataContainer(std::move(command_data), fence)); | 152 | state.queue.Push(CommandDataContainer(std::move(command_data), fence)); |
| 153 | |||
| 154 | if (!is_async) { | ||
| 155 | // In synchronous GPU mode, block the caller until the command has executed | ||
| 156 | WaitIdle(); | ||
| 157 | } | ||
| 158 | |||
| 137 | return fence; | 159 | return fence; |
| 138 | } | 160 | } |
| 139 | 161 | ||