Merge pull request #5208 from bunnei/service-threads

Service threads
author: bunnei 2020-12-30 22:06:05 -0800
committer: GitHub 2020-12-30 22:06:05 -0800
commit: 25d607f5f63929369fb74f386a920b69bb24f442 (patch)
tree: 9ee5a023f033d99561a0358c5c71aeecc92c9d64 /src/video_core/gpu_thread.cpp
parent: Merge pull request #5263 from lioncash/uninit (diff)
parent: hle: kernel: service_thread: Make thread naming more consistent. (diff)
download: yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.gz
yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.xz
yuzu-25d607f5f63929369fb74f386a920b69bb24f442.zip
1 files changed, 29 insertions, 7 deletions
diff --git a/src/video_core/gpu_thread.cpp b/src/video_core/gpu_thread.cpp
index e27218b96..7e490bcc3 100644
--- a/src/video_core/gpu_thread.cpp
+++ b/src/video_core/gpu_thread.cpp
@@ -4,6 +4,7 @@
 #include "common/assert.h"
 #include "common/microprofile.h"
+#include "common/scope_exit.h"
 #include "common/thread.h"
 #include "core/core.h"
 #include "core/frontend/emu_window.h"
@@ -21,6 +22,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,
                      SynchState& state, Tegra::CDmaPusher& cdma_pusher) {
    std::string name = "yuzu:GPU";
    MicroProfileOnThreadCreate(name.c_str());
+    SCOPE_EXIT({ MicroProfileOnThreadExit(); });
    Common::SetCurrentThreadName(name.c_str());
    Common::SetCurrentThreadPriority(Common::ThreadPriority::High);
    system.RegisterHostThread();
@@ -65,7 +68,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,
    }
 }
-ThreadManager::ThreadManager(Core::System& system_) : system{system_} {}
+ThreadManager::ThreadManager(Core::System& system_, bool is_async_)
+    : system{system_}, is_async{is_async_} {}
 ThreadManager::~ThreadManager() {
    if (!thread.joinable()) {
@@ -97,19 +101,30 @@ void ThreadManager::SwapBuffers(const Tegra::FramebufferConfig* framebuffer) {
 }
 void ThreadManager::FlushRegion(VAddr addr, u64 size) {
-    if (!Settings::IsGPULevelHigh()) {
+    if (!is_async) {
+        // Always flush with synchronous GPU mode
        PushCommand(FlushRegionCommand(addr, size));
        return;
    }
-    if (!Settings::IsGPULevelExtreme()) {
-        return;
+    // Asynchronous GPU mode
-    }
+    switch (Settings::values.gpu_accuracy.GetValue()) {
-    if (system.Renderer().Rasterizer().MustFlushRegion(addr, size)) {
+    case Settings::GPUAccuracy::Normal:
+        PushCommand(FlushRegionCommand(addr, size));
+        break;
+    case Settings::GPUAccuracy::High:
+        // TODO(bunnei): Is this right? Preserving existing behavior for now
+        break;
+    case Settings::GPUAccuracy::Extreme: {
        auto& gpu = system.GPU();
        u64 fence = gpu.RequestFlush(addr, size);
        PushCommand(GPUTickCommand());
        while (fence > gpu.CurrentFlushRequestFence()) {
        }
+        break;
+    }
+    default:
+        UNIMPLEMENTED_MSG("Unsupported gpu_accuracy {}", Settings::values.gpu_accuracy.GetValue());
    }
 }
@@ -123,7 +138,8 @@ void ThreadManager::FlushAndInvalidateRegion(VAddr addr, u64 size) {
 }
 void ThreadManager::WaitIdle() const {
-    while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed)) {
+    while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed) &&
+           system.IsPoweredOn()) {
    }
 }
@@ -134,6 +150,12 @@ void ThreadManager::OnCommandListEnd() {
 u64 ThreadManager::PushCommand(CommandData&& command_data) {
    const u64 fence{++state.last_fence};
    state.queue.Push(CommandDataContainer(std::move(command_data), fence));
+    if (!is_async) {
+        // In synchronous GPU mode, block the caller until the command has executed
+        WaitIdle();
+    }
    return fence;
 }
author	bunnei	2020-12-30 22:06:05 -0800
committer	GitHub	2020-12-30 22:06:05 -0800
commit	25d607f5f63929369fb74f386a920b69bb24f442 (patch)
tree	9ee5a023f033d99561a0358c5c71aeecc92c9d64 /src/video_core/gpu_thread.cpp
parent	Merge pull request #5263 from lioncash/uninit (diff)
parent	hle: kernel: service_thread: Make thread naming more consistent. (diff)
download	yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.gz yuzu-25d607f5f63929369fb74f386a920b69bb24f442.tar.xz yuzu-25d607f5f63929369fb74f386a920b69bb24f442.zip

diff --git a/src/video_core/gpu_thread.cpp b/src/video_core/gpu_thread.cpp index e27218b96..7e490bcc3 100644 --- a/src/video_core/gpu_thread.cpp +++ b/src/video_core/gpu_thread.cpp
@@ -4,6 +4,7 @@
4		4
5	#include "common/assert.h"	5	#include "common/assert.h"
6	#include "common/microprofile.h"	6	#include "common/microprofile.h"
		7	#include "common/scope_exit.h"
7	#include "common/thread.h"	8	#include "common/thread.h"
8	#include "core/core.h"	9	#include "core/core.h"
9	#include "core/frontend/emu_window.h"	10	#include "core/frontend/emu_window.h"
@@ -21,6 +22,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,
21	SynchState& state, Tegra::CDmaPusher& cdma_pusher) {	22	SynchState& state, Tegra::CDmaPusher& cdma_pusher) {
22	std::string name = "yuzu:GPU";	23	std::string name = "yuzu:GPU";
23	MicroProfileOnThreadCreate(name.c_str());	24	MicroProfileOnThreadCreate(name.c_str());
		25	SCOPE_EXIT({ MicroProfileOnThreadExit(); });
		26
24	Common::SetCurrentThreadName(name.c_str());	27	Common::SetCurrentThreadName(name.c_str());
25	Common::SetCurrentThreadPriority(Common::ThreadPriority::High);	28	Common::SetCurrentThreadPriority(Common::ThreadPriority::High);
26	system.RegisterHostThread();	29	system.RegisterHostThread();
@@ -65,7 +68,8 @@ static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,
65	}	68	}
66	}	69	}
67		70
68	ThreadManager::ThreadManager(Core::System& system_) : system{system_} {}	71	ThreadManager::ThreadManager(Core::System& system_, bool is_async_)
		72	: system{system_}, is_async{is_async_} {}
69		73
70	ThreadManager::~ThreadManager() {	74	ThreadManager::~ThreadManager() {
71	if (!thread.joinable()) {	75	if (!thread.joinable()) {
@@ -97,19 +101,30 @@ void ThreadManager::SwapBuffers(const Tegra::FramebufferConfig* framebuffer) {
97	}	101	}
98		102
99	void ThreadManager::FlushRegion(VAddr addr, u64 size) {	103	void ThreadManager::FlushRegion(VAddr addr, u64 size) {
100	if (!Settings::IsGPULevelHigh()) {	104	if (!is_async) {
		105	// Always flush with synchronous GPU mode
101	PushCommand(FlushRegionCommand(addr, size));	106	PushCommand(FlushRegionCommand(addr, size));
102	return;	107	return;
103	}	108	}
104	if (!Settings::IsGPULevelExtreme()) {	109
105	return;	110	// Asynchronous GPU mode
106	}	111	switch (Settings::values.gpu_accuracy.GetValue()) {
107	if (system.Renderer().Rasterizer().MustFlushRegion(addr, size)) {	112	case Settings::GPUAccuracy::Normal:
		113	PushCommand(FlushRegionCommand(addr, size));
		114	break;
		115	case Settings::GPUAccuracy::High:
		116	// TODO(bunnei): Is this right? Preserving existing behavior for now
		117	break;
		118	case Settings::GPUAccuracy::Extreme: {
108	auto& gpu = system.GPU();	119	auto& gpu = system.GPU();
109	u64 fence = gpu.RequestFlush(addr, size);	120	u64 fence = gpu.RequestFlush(addr, size);
110	PushCommand(GPUTickCommand());	121	PushCommand(GPUTickCommand());
111	while (fence > gpu.CurrentFlushRequestFence()) {	122	while (fence > gpu.CurrentFlushRequestFence()) {
112	}	123	}
		124	break;
		125	}
		126	default:
		127	UNIMPLEMENTED_MSG("Unsupported gpu_accuracy {}", Settings::values.gpu_accuracy.GetValue());
113	}	128	}
114	}	129	}
115		130
@@ -123,7 +138,8 @@ void ThreadManager::FlushAndInvalidateRegion(VAddr addr, u64 size) {
123	}	138	}
124		139
125	void ThreadManager::WaitIdle() const {	140	void ThreadManager::WaitIdle() const {
126	while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed)) {	141	while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed) &&
		142	system.IsPoweredOn()) {
127	}	143	}
128	}	144	}
129		145
@@ -134,6 +150,12 @@ void ThreadManager::OnCommandListEnd() {
134	u64 ThreadManager::PushCommand(CommandData&& command_data) {	150	u64 ThreadManager::PushCommand(CommandData&& command_data) {
135	const u64 fence{++state.last_fence};	151	const u64 fence{++state.last_fence};
136	state.queue.Push(CommandDataContainer(std::move(command_data), fence));	152	state.queue.Push(CommandDataContainer(std::move(command_data), fence));
		153
		154	if (!is_async) {
		155	// In synchronous GPU mode, block the caller until the command has executed
		156	WaitIdle();
		157	}
		158
137	return fence;	159	return fence;
138	}	160	}
139		161