citra/src/video_core/gpu_thread.cpp

// Copyright 2019 yuzu Emulator Project
// Licensed under GPLv2 or any later version
// Refer to the license.txt file included.

#include "common/assert.h"
#include "common/microprofile.h"
#include "common/scope_exit.h"
#include "common/thread.h"
#include "core/core.h"
#include "core/frontend/emu_window.h"
#include "core/settings.h"
#include "video_core/dma_pusher.h"
#include "video_core/gpu.h"
#include "video_core/gpu_thread.h"
#include "video_core/renderer_base.h"

namespace VideoCommon::GPUThread {

/// Entry point of the GPU worker thread.
///
/// Names and registers the thread, waits until the first command is queued, acquires the
/// graphics context and then pops and executes queued commands until shutdown is requested.
/// After each executed command the command's fence is stored into state.signaled_fence so
/// that waiters (see ThreadManager::WaitIdle) can observe progress.
///
/// @param system      Used to register this host thread and to reach the GPU for tick work.
/// @param renderer    Receives buffer swaps; its rasterizer handles fences, flushes and
///                    CPU-write notifications.
/// @param context     Graphics context acquired once the first command has arrived.
/// @param dma_pusher  Consumes SubmitListCommand entries.
/// @param state       Shared queue, running flag and signaled fence.
/// @param cdma_pusher Consumes SubmitChCommandEntries (NVDEC) entries.
static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,
                      Core::Frontend::GraphicsContext& context, Tegra::DmaPusher& dma_pusher,
                      SynchState& state, Tegra::CDmaPusher& cdma_pusher) {
    std::string name = "yuzu:GPU";
    MicroProfileOnThreadCreate(name.c_str());
    // Make sure MicroProfile is told about the thread exit on every return path below
    SCOPE_EXIT({ MicroProfileOnThreadExit(); });

    Common::SetCurrentThreadName(name.c_str());
    Common::SetCurrentThreadPriority(Common::ThreadPriority::High);
    system.RegisterHostThread();

    // Wait for first GPU command before acquiring the window context
    while (state.queue.Empty())
        ;

    // If emulation was stopped during disk shader loading, abort before trying to acquire context
    if (!state.is_running) {
        return;
    }

    // Held for the remainder of the thread's lifetime
    auto current_context = context.Acquire();

    CommandDataContainer next;
    while (state.is_running) {
        next = state.queue.PopWait();
        if (auto* submit_list = std::get_if<SubmitListCommand>(&next.data)) {
            dma_pusher.Push(std::move(submit_list->entries));
            dma_pusher.DispatchCalls();
        } else if (auto* command_list = std::get_if<SubmitChCommandEntries>(&next.data)) {
            // NVDEC
            cdma_pusher.Push(std::move(command_list->entries));
            cdma_pusher.DispatchCalls();
        } else if (const auto* data = std::get_if<SwapBuffersCommand>(&next.data)) {
            renderer.SwapBuffers(data->framebuffer ? &*data->framebuffer : nullptr);
        } else if (std::holds_alternative<OnCommandListEndCommand>(next.data)) {
            renderer.Rasterizer().ReleaseFences();
        } else if (std::holds_alternative<GPUTickCommand>(next.data)) {
            system.GPU().TickWork();
        } else if (const auto* flush = std::get_if<FlushRegionCommand>(&next.data)) {
            renderer.Rasterizer().FlushRegion(flush->addr, flush->size);
        } else if (const auto* invalidate = std::get_if<InvalidateRegionCommand>(&next.data)) {
            renderer.Rasterizer().OnCPUWrite(invalidate->addr, invalidate->size);
        } else if (std::holds_alternative<EndProcessingCommand>(next.data)) {
            // Signal the shutdown command's fence before leaving. In synchronous mode the
            // thread that pushed it is blocked in WaitIdle() until this fence is published;
            // returning without signaling would leave it spinning until the system powers off.
            state.signaled_fence.store(next.fence);
            return;
        } else {
            UNREACHABLE();
        }
        state.signaled_fence.store(next.fence);
    }
}

/// Remembers the owning system and whether the GPU is driven asynchronously.
/// The worker thread itself is launched later through StartThread().
ThreadManager::ThreadManager(Core::System& system_, bool is_async_)
    : system(system_), is_async(is_async_) {}

/// Shuts the worker thread down, if one was ever started.
ThreadManager::~ThreadManager() {
    if (thread.joinable()) {
        // Ask the GPU thread to leave its processing loop, then wait for it to finish
        PushCommand(EndProcessingCommand());
        thread.join();
    }
}

/// Launches the GPU worker thread running RunThread.
/// All collaborators are handed over by reference, together with this manager's own
/// system and synchronization state.
void ThreadManager::StartThread(VideoCore::RendererBase& renderer,
                                Core::Frontend::GraphicsContext& context,
                                Tegra::DmaPusher& dma_pusher, Tegra::CDmaPusher& cdma_pusher) {
    std::thread worker(RunThread, std::ref(system), std::ref(renderer), std::ref(context),
                       std::ref(dma_pusher), std::ref(state), std::ref(cdma_pusher));
    thread = std::move(worker);
}

/// Queues a command list for the GPU thread, taking ownership of the entries.
void ThreadManager::SubmitList(Tegra::CommandList&& entries) {
    SubmitListCommand command(std::move(entries));
    PushCommand(std::move(command));
}

/// Queues a channel command header list for the GPU thread, taking ownership of the entries.
void ThreadManager::SubmitCommandBuffer(Tegra::ChCommandHeaderList&& entries) {
    SubmitChCommandEntries command(std::move(entries));
    PushCommand(std::move(command));
}

/// Queues a buffer swap. When a framebuffer config is supplied it is copied into the
/// command; a null pointer is forwarded as an empty optional.
void ThreadManager::SwapBuffers(const Tegra::FramebufferConfig* framebuffer) {
    if (framebuffer == nullptr) {
        PushCommand(SwapBuffersCommand(std::nullopt));
        return;
    }
    PushCommand(SwapBuffersCommand(std::make_optional(*framebuffer)));
}

/// Requests a flush of the given region.
///
/// Synchronous mode always queues a FlushRegionCommand. In asynchronous mode the behavior
/// depends on the configured GPU accuracy:
///  - Normal:  queue a FlushRegionCommand.
///  - High:    do nothing.
///  - Extreme: register a flush request with the GPU, queue a tick and spin until the GPU's
///             current flush-request fence has caught up with the one just requested.
void ThreadManager::FlushRegion(VAddr addr, u64 size) {
    if (is_async) {
        const auto accuracy = Settings::values.gpu_accuracy.GetValue();
        if (accuracy == Settings::GPUAccuracy::Normal) {
            PushCommand(FlushRegionCommand(addr, size));
        } else if (accuracy == Settings::GPUAccuracy::High) {
            // TODO(bunnei): Is this right? Preserving existing behavior for now
        } else if (accuracy == Settings::GPUAccuracy::Extreme) {
            auto& gpu = system.GPU();
            const u64 requested_fence = gpu.RequestFlush(addr, size);
            PushCommand(GPUTickCommand());
            // Busy-wait for the GPU thread to service the request
            while (requested_fence > gpu.CurrentFlushRequestFence()) {
            }
        } else {
            UNIMPLEMENTED_MSG("Unsupported gpu_accuracy {}", accuracy);
        }
        return;
    }

    // Synchronous GPU mode: the flush is never skipped
    PushCommand(FlushRegionCommand(addr, size));
}

/// Reports a CPU write over the given region to the rasterizer. The call is made directly
/// from here rather than being queued as a command.
void ThreadManager::InvalidateRegion(VAddr addr, u64 size) {
    auto&& rasterizer = system.Renderer().Rasterizer();
    rasterizer.OnCPUWrite(addr, size);
}

/// Reports a CPU write over the given region to the rasterizer without flushing first.
void ThreadManager::FlushAndInvalidateRegion(VAddr addr, u64 size) {
    // The flush half is skipped, as FlushAndInvalidateRegion is not used for anything too
    // important.
    // NOTE(review): the flush is skipped regardless of is_async, not only in async mode.
    auto&& rasterizer = system.Renderer().Rasterizer();
    rasterizer.OnCPUWrite(addr, size);
}

/// Spins until the GPU thread has signaled the fence of the most recently pushed command,
/// or until the system is no longer powered on.
void ThreadManager::WaitIdle() const {
    // Acquire (rather than relaxed) so that observing the signaled fence also makes the GPU
    // thread's preceding work visible to the caller. Synchronous mode relies on this wait as
    // its "command has executed" barrier, and a relaxed load establishes no such ordering.
    while (state.last_fence > state.signaled_fence.load(std::memory_order_acquire) &&
           system.IsPoweredOn()) {
    }
}

/// Queues an end-of-command-list marker for the GPU thread.
void ThreadManager::OnCommandListEnd() {
    auto command = OnCommandListEndCommand();
    PushCommand(std::move(command));
}

/// Tags the command with the next fence value and appends it to the GPU thread's queue.
/// In synchronous mode the caller is additionally blocked in WaitIdle() before returning.
///
/// @param command_data Command to enqueue; moved into the queue.
/// @return The fence value assigned to the command.
u64 ThreadManager::PushCommand(CommandData&& command_data) {
    const u64 fence = ++state.last_fence;
    state.queue.Push(CommandDataContainer(std::move(command_data), fence));

    if (is_async) {
        return fence;
    }

    // Synchronous GPU mode: do not return until the queue has been drained
    WaitIdle();
    return fence;
}

} // namespace VideoCommon::GPUThread
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`// Copyright 2019 yuzu Emulator Project`
			`// Licensed under GPLv2 or any later version`
			`// Refer to the license.txt file included.`

			`#include "common/assert.h"`
			`#include "common/microprofile.h"`
gpu: gpu_thread: Ensure MicroProfile is shutdown on exit. 2020-12-25 07:28:46 +00:00			`#include "common/scope_exit.h"`
General: Setup yuzu threads' microprofile, naming and registry. 2020-02-25 15:12:46 +00:00			`#include "common/thread.h"`
gpu_thread: Improve synchronization by using CoreTiming. 2019-03-31 00:08:09 +00:00			`#include "core/core.h"`
Frontend/GPU: Refactor context management Changes the GraphicsContext to be managed by the GPU core. This eliminates the need for the frontends to fool around with tricky MakeCurrent/DoneCurrent calls that are dependent on the settings (such as async gpu option). This also refactors out the need to use QWidget::fromWindowContainer as that caused issues with focus and input handling. Now we use a regular QWidget and just access the native windowHandle() directly. Another change is removing the debug tool setting in FrameMailbox. Instead of trying to block the frontend until a new frame is ready, the core will now take over presentation and draw directly to the window if the renderer detects that its hooked by NSight or RenderDoc Lastly, since it was in the way, I removed ScopeAcquireWindowContext and replaced it with a simple subclass in GraphicsContext that achieves the same result 2020-03-25 02:58:49 +00:00			`#include "core/frontend/emu_window.h"`
ThreadManager: Sync async reads on accurate gpu. 2020-02-18 02:29:04 +00:00			`#include "core/settings.h"`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`#include "video_core/dma_pusher.h"`
			`#include "video_core/gpu.h"`
			`#include "video_core/gpu_thread.h"`
			`#include "video_core/renderer_base.h"`

			`namespace VideoCommon::GPUThread {`

			`/// Runs the GPU thread`
GPU: Implement Flush Requests for Async mode. 2020-02-20 15:55:32 +00:00			`static void RunThread(Core::System& system, VideoCore::RendererBase& renderer,`
			`Core::Frontend::GraphicsContext& context, Tegra::DmaPusher& dma_pusher,`
video_core: NVDEC Implementation This commit aims to implement the NVDEC (Nvidia Decoder) functionality, with video frame decoding being handled by the FFmpeg library. The process begins with Ioctl commands being sent to the NVDEC and VIC (Video Image Composer) emulated devices. These allocate the necessary GPU buffers for the frame data, along with providing information on the incoming video data. A Submit command then signals the GPU to process and decode the frame data. To decode the frame, the respective codec's header must be manually composed from the information provided by NVDEC, then sent with the raw frame data to the ffmpeg library. Currently, H264 and VP9 are supported, with VP9 having some minor artifacting issues related mainly to the reference frame composition in its uncompressed header. Async GPU is not properly implemented at the moment. Co-Authored-By: David <25727384+ogniK5377@users.noreply.github.com> 2020-10-27 03:07:36 +00:00			`SynchState& state, Tegra::CDmaPusher& cdma_pusher) {`
General: Setup yuzu threads' microprofile, naming and registry. 2020-02-25 15:12:46 +00:00			`std::string name = "yuzu:GPU";`
			`MicroProfileOnThreadCreate(name.c_str());`
gpu: gpu_thread: Ensure MicroProfile is shutdown on exit. 2020-12-25 07:28:46 +00:00			`SCOPE_EXIT({ MicroProfileOnThreadExit(); });`

General: Setup yuzu threads' microprofile, naming and registry. 2020-02-25 15:12:46 +00:00			`Common::SetCurrentThreadName(name.c_str());`
General: Tune the priority of main emulation threads so they have higher priority than less important helper threads. 2020-04-05 13:48:53 +00:00			`Common::SetCurrentThreadPriority(Common::ThreadPriority::High);`
General: Setup yuzu threads' microprofile, naming and registry. 2020-02-25 15:12:46 +00:00			`system.RegisterHostThread();`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00
			`// Wait for first GPU command before acquiring the window context`
NVFlinger: Correct GCC compile error 2019-06-18 20:58:29 +00:00			`while (state.queue.Empty())`
			`;`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00
			`// If emulation was stopped during disk shader loading, abort before trying to acquire context`
			`if (!state.is_running) {`
			`return;`
			`}`

Frontend/GPU: Refactor context management Changes the GraphicsContext to be managed by the GPU core. This eliminates the need for the frontends to fool around with tricky MakeCurrent/DoneCurrent calls that are dependent on the settings (such as async gpu option). This also refactors out the need to use QWidget::fromWindowContainer as that caused issues with focus and input handling. Now we use a regular QWidget and just access the native windowHandle() directly. Another change is removing the debug tool setting in FrameMailbox. Instead of trying to block the frontend until a new frame is ready, the core will now take over presentation and draw directly to the window if the renderer detects that its hooked by NSight or RenderDoc Lastly, since it was in the way, I removed ScopeAcquireWindowContext and replaced it with a simple subclass in GraphicsContext that achieves the same result 2020-03-25 02:58:49 +00:00			`auto current_context = context.Acquire();`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00
gpu: Use host address for caching instead of guest address. 2019-02-19 01:58:32 +00:00			`CommandDataContainer next;`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`while (state.is_running) {`
gpu_thread: Don't spin wait if there are no GPU commands. 2019-11-23 20:17:28 +00:00			`next = state.queue.PopWait();`
video_core: Resolve more variable shadowing scenarios Resolves variable shadowing scenarios up to the end of the OpenGL code to make it nicer to review. The rest will be resolved in a following commit. 2020-12-04 19:39:12 +00:00			`if (auto* submit_list = std::get_if<SubmitListCommand>(&next.data)) {`
gpu_thread: Don't spin wait if there are no GPU commands. 2019-11-23 20:17:28 +00:00			`dma_pusher.Push(std::move(submit_list->entries));`
			`dma_pusher.DispatchCalls();`
video_core: Resolve more variable shadowing scenarios Resolves variable shadowing scenarios up to the end of the OpenGL code to make it nicer to review. The rest will be resolved in a following commit. 2020-12-04 19:39:12 +00:00			`} else if (auto* command_list = std::get_if<SubmitChCommandEntries>(&next.data)) {`
video_core: NVDEC Implementation This commit aims to implement the NVDEC (Nvidia Decoder) functionality, with video frame decoding being handled by the FFmpeg library. The process begins with Ioctl commands being sent to the NVDEC and VIC (Video Image Composer) emulated devices. These allocate the necessary GPU buffers for the frame data, along with providing information on the incoming video data. A Submit command then signals the GPU to process and decode the frame data. To decode the frame, the respective codec's header must be manually composed from the information provided by NVDEC, then sent with the raw frame data to the ffmpeg library. Currently, H264 and VP9 are supported, with VP9 having some minor artifacting issues related mainly to the reference frame composition in its uncompressed header. Async GPU is not properly implemented at the moment. Co-Authored-By: David <25727384+ogniK5377@users.noreply.github.com> 2020-10-27 03:07:36 +00:00			`// NVDEC`
			`cdma_pusher.Push(std::move(command_list->entries));`
			`cdma_pusher.DispatchCalls();`
video_core: Resolve more variable shadowing scenarios Resolves variable shadowing scenarios up to the end of the OpenGL code to make it nicer to review. The rest will be resolved in a following commit. 2020-12-04 19:39:12 +00:00			`} else if (const auto* data = std::get_if<SwapBuffersCommand>(&next.data)) {`
gpu_thread: Don't spin wait if there are no GPU commands. 2019-11-23 20:17:28 +00:00			`renderer.SwapBuffers(data->framebuffer ? &*data->framebuffer : nullptr);`
video_core: Remove unused variables Silences several compiler warnings about unused variables. 2020-07-21 04:52:27 +00:00			`} else if (std::holds_alternative<OnCommandListEndCommand>(next.data)) {`
OpenGL: Implement Fencing backend. 2020-02-17 22:10:23 +00:00			`renderer.Rasterizer().ReleaseFences();`
video_core: Remove unused variables Silences several compiler warnings about unused variables. 2020-07-21 04:52:27 +00:00			`} else if (std::holds_alternative<GPUTickCommand>(next.data)) {`
GPU: Implement Flush Requests for Async mode. 2020-02-20 15:55:32 +00:00			`system.GPU().TickWork();`
video_core: Resolve more variable shadowing scenarios Resolves variable shadowing scenarios up to the end of the OpenGL code to make it nicer to review. The rest will be resolved in a following commit. 2020-12-04 19:39:12 +00:00			`} else if (const auto* flush = std::get_if<FlushRegionCommand>(&next.data)) {`
			`renderer.Rasterizer().FlushRegion(flush->addr, flush->size);`
			`} else if (const auto* invalidate = std::get_if<InvalidateRegionCommand>(&next.data)) {`
			`renderer.Rasterizer().OnCPUWrite(invalidate->addr, invalidate->size);`
gpu_thread: Don't spin wait if there are no GPU commands. 2019-11-23 20:17:28 +00:00			`} else if (std::holds_alternative<EndProcessingCommand>(next.data)) {`
			`return;`
			`} else {`
			`UNREACHABLE();`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`
gpu_thread: Don't spin wait if there are no GPU commands. 2019-11-23 20:17:28 +00:00			`state.signaled_fence.store(next.fence);`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`
			`}`

video_core: gpu: Implement synchronous mode using threaded GPU. 2020-12-12 08:24:33 +00:00			`ThreadManager::ThreadManager(Core::System& system_, bool is_async_)`
			`: system{system_}, is_async{is_async_} {}`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00
			`ThreadManager::~ThreadManager() {`
video_core/gpu: Create threads separately from initialization Like with CPU emulation, we generally don't want to fire off the threads immediately after the relevant classes are initialized, we want to do this after all necessary data is done loading first. This splits the thread creation into its own interface member function to allow controlling when these threads in particular get created. 2019-04-09 18:02:00 +00:00			`if (!thread.joinable()) {`
			`return;`
			`}`

gpu: Use host address for caching instead of guest address. 2019-02-19 01:58:32 +00:00			`// Notify GPU thread that a shutdown is pending`
			`PushCommand(EndProcessingCommand());`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`thread.join();`
			`}`

Frontend/GPU: Refactor context management Changes the GraphicsContext to be managed by the GPU core. This eliminates the need for the frontends to fool around with tricky MakeCurrent/DoneCurrent calls that are dependent on the settings (such as async gpu option). This also refactors out the need to use QWidget::fromWindowContainer as that caused issues with focus and input handling. Now we use a regular QWidget and just access the native windowHandle() directly. Another change is removing the debug tool setting in FrameMailbox. Instead of trying to block the frontend until a new frame is ready, the core will now take over presentation and draw directly to the window if the renderer detects that its hooked by NSight or RenderDoc Lastly, since it was in the way, I removed ScopeAcquireWindowContext and replaced it with a simple subclass in GraphicsContext that achieves the same result 2020-03-25 02:58:49 +00:00			`void ThreadManager::StartThread(VideoCore::RendererBase& renderer,`
			`Core::Frontend::GraphicsContext& context,`
video_core: NVDEC Implementation This commit aims to implement the NVDEC (Nvidia Decoder) functionality, with video frame decoding being handled by the FFmpeg library. The process begins with Ioctl commands being sent to the NVDEC and VIC (Video Image Composer) emulated devices. These allocate the necessary GPU buffers for the frame data, along with providing information on the incoming video data. A Submit command then signals the GPU to process and decode the frame data. To decode the frame, the respective codec's header must be manually composed from the information provided by NVDEC, then sent with the raw frame data to the ffmpeg library. Currently, H264 and VP9 are supported, with VP9 having some minor artifacting issues related mainly to the reference frame composition in its uncompressed header. Async GPU is not properly implemented at the moment. Co-Authored-By: David <25727384+ogniK5377@users.noreply.github.com> 2020-10-27 03:07:36 +00:00			`Tegra::DmaPusher& dma_pusher, Tegra::CDmaPusher& cdma_pusher) {`
			`thread = std::thread(RunThread, std::ref(system), std::ref(renderer), std::ref(context),`
			`std::ref(dma_pusher), std::ref(state), std::ref(cdma_pusher));`
video_core/gpu: Create threads separately from initialization Like with CPU emulation, we generally don't want to fire off the threads immediately after the relevant classes are initialized, we want to do this after all necessary data is done loading first. This splits the thread creation into its own interface member function to allow controlling when these threads in particular get created. 2019-04-09 18:02:00 +00:00			`}`

gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`void ThreadManager::SubmitList(Tegra::CommandList&& entries) {`
GPU_Async: Correct fences, display events and more. This commit uses guest fences on vSync event instead of an articial fake fence we had. It also corrects to keep signaling display events while loading the game as the OS is suppose to send buffers to vSync during that time. 2019-09-25 23:43:23 +00:00			`PushCommand(SubmitListCommand(std::move(entries)));`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`

video_core: NVDEC Implementation This commit aims to implement the NVDEC (Nvidia Decoder) functionality, with video frame decoding being handled by the FFmpeg library. The process begins with Ioctl commands being sent to the NVDEC and VIC (Video Image Composer) emulated devices. These allocate the necessary GPU buffers for the frame data, along with providing information on the incoming video data. A Submit command then signals the GPU to process and decode the frame data. To decode the frame, the respective codec's header must be manually composed from the information provided by NVDEC, then sent with the raw frame data to the ffmpeg library. Currently, H264 and VP9 are supported, with VP9 having some minor artifacting issues related mainly to the reference frame composition in its uncompressed header. Async GPU is not properly implemented at the moment. Co-Authored-By: David <25727384+ogniK5377@users.noreply.github.com> 2020-10-27 03:07:36 +00:00			`void ThreadManager::SubmitCommandBuffer(Tegra::ChCommandHeaderList&& entries) {`
			`PushCommand(SubmitChCommandEntries(std::move(entries)));`
			`}`

gpu: Change optional<reference_wrapper<T>> to T* for FramebufferConfig 2019-08-21 04:55:25 +00:00			`void ThreadManager::SwapBuffers(const Tegra::FramebufferConfig* framebuffer) {`
video_core/gpu_thread: Tidy up SwapBuffers() We can just use std::nullopt and std::make_optional to make this a little bit less noisy. 2019-11-27 22:46:07 +00:00			`PushCommand(SwapBuffersCommand(framebuffer ? std::make_optional(*framebuffer) : std::nullopt));`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`

GPU: Setup Flush/Invalidate to use VAddr instead of CacheAddr 2020-04-05 16:58:23 +00:00			`void ThreadManager::FlushRegion(VAddr addr, u64 size) {`
video_core: gpu: Implement synchronous mode using threaded GPU. 2020-12-12 08:24:33 +00:00			`if (!is_async) {`
			`// Always flush with synchronous GPU mode`
Async GPU: Correct flushing behavior to be similar to old async GPU behavior. 2020-04-19 17:47:45 +00:00			`PushCommand(FlushRegionCommand(addr, size));`
			`return;`
			`}`
video_core: gpu: Implement synchronous mode using threaded GPU. 2020-12-12 08:24:33 +00:00
			`// Asynchronous GPU mode`
			`switch (Settings::values.gpu_accuracy.GetValue()) {`
			`case Settings::GPUAccuracy::Normal:`
			`PushCommand(FlushRegionCommand(addr, size));`
			`break;`
			`case Settings::GPUAccuracy::High:`
			`// TODO(bunnei): Is this right? Preserving existing behavior for now`
			`break;`
			`case Settings::GPUAccuracy::Extreme: {`
GPU: Implement Flush Requests for Async mode. 2020-02-20 15:55:32 +00:00			`auto& gpu = system.GPU();`
			`u64 fence = gpu.RequestFlush(addr, size);`
			`PushCommand(GPUTickCommand());`
			`while (fence > gpu.CurrentFlushRequestFence()) {`
ThreadManager: Sync async reads on accurate gpu. 2020-02-18 02:29:04 +00:00			`}`
video_core: gpu: Implement synchronous mode using threaded GPU. 2020-12-12 08:24:33 +00:00			`break;`
			`}`
			`default:`
			`UNIMPLEMENTED_MSG("Unsupported gpu_accuracy {}", Settings::values.gpu_accuracy.GetValue());`
ThreadManager: Sync async reads on accurate gpu. 2020-02-18 02:29:04 +00:00			`}`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`

GPU: Setup Flush/Invalidate to use VAddr instead of CacheAddr 2020-04-05 16:58:23 +00:00			`void ThreadManager::InvalidateRegion(VAddr addr, u64 size) {`
GPU: Refactor synchronization on Async GPU 2020-02-16 13:51:37 +00:00			`system.Renderer().Rasterizer().OnCPUWrite(addr, size);`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`

GPU: Setup Flush/Invalidate to use VAddr instead of CacheAddr 2020-04-05 16:58:23 +00:00			`void ThreadManager::FlushAndInvalidateRegion(VAddr addr, u64 size) {`
gpu: Use host address for caching instead of guest address. 2019-02-19 01:58:32 +00:00			`// Skip flush on asynch mode, as FlushAndInvalidateRegion is not used for anything too important`
GPU: Refactor synchronization on Async GPU 2020-02-16 13:51:37 +00:00			`system.Renderer().Rasterizer().OnCPUWrite(addr, size);`
gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`}`

Core: Wait for GPU to be idle before shutting down. 2019-09-26 23:08:22 +00:00			`void ThreadManager::WaitIdle() const {`
video_core: gpu_thread: Do not wait when system is powered down. 2020-12-12 09:37:06 +00:00			`while (state.last_fence > state.signaled_fence.load(std::memory_order_relaxed) &&`
			`system.IsPoweredOn()) {`
Core: Wait for GPU to be idle before shutting down. 2019-09-26 23:08:22 +00:00			`}`
			`}`

OpenGL: Implement Fencing backend. 2020-02-17 22:10:23 +00:00			`void ThreadManager::OnCommandListEnd() {`
			`PushCommand(OnCommandListEndCommand());`
			`}`

gpu_thread: Improve synchronization by using CoreTiming. 2019-03-31 00:08:09 +00:00			`u64 ThreadManager::PushCommand(CommandData&& command_data) {`
			`const u64 fence{++state.last_fence};`
			`state.queue.Push(CommandDataContainer(std::move(command_data), fence));`
video_core: gpu: Implement synchronous mode using threaded GPU. 2020-12-12 08:24:33 +00:00
			`if (!is_async) {`
			`// In synchronous GPU mode, block the caller until the command has executed`
			`WaitIdle();`
			`}`

gpu_thread: Improve synchronization by using CoreTiming. 2019-03-31 00:08:09 +00:00			`return fence;`
			`}`

gpu: Move command processing to another thread. 2019-01-24 03:17:55 +00:00			`} // namespace VideoCommon::GPUThread`