rpcs3/rpcs3/Emu/RSX/VK/VKAsyncScheduler.cpp
2021-04-30 08:23:16 +02:00

229 lines
6 KiB
C++

#include "VKAsyncScheduler.h"
#include "VKHelpers.h"
#include "VKResourceManager.h"
#include "Emu/IdManager.h"
#include "Utilities/lockless.h"
#include "Utilities/mutex.h"
#include <vector>
namespace vk
{
void AsyncTaskScheduler::operator()()
{
init_config_options();
if (!m_use_host_scheduler)
{
// No need to keep the GPU alive using a CPU thread.
rsx_log.notice("Host scheduler is disabled. This thread will now exit.");
return;
}
// If this thread is unavailable for too long, your GPU will hard crash and force a full reset
// TODO: Investigate if this can be executed outside the application context. Attach a debugger to rpcs3 and boom - GPU reset. Not fun rebooting so often.
thread_ctrl::set_native_priority(1);
add_ref();
while (thread_ctrl::state() != thread_state::aborting)
{
for (auto&& job : m_event_queue.pop_all())
{
if (job->type == xqueue_event_type::barrier)
{
// Blocks the queue from progressing until the work items are actually submitted to the GPU
// Avoids spamming the GPU with event requests when the events have not even been submitted yet
while (job->completion_eid == m_submit_count.load())
{
thread_ctrl::wait_for(100);
}
continue;
}
vk::wait_for_event(job->queue1_signal.get(), GENERAL_WAIT_TIMEOUT);
job->queue2_signal->host_signal();
}
}
release();
}
void AsyncTaskScheduler::init_config_options()
{
std::lock_guard lock(m_config_mutex);
if (std::exchange(m_options_initialized, true))
{
// Nothing to do
return;
}
m_use_host_scheduler = g_cfg.video.vk.asynchronous_scheduler == vk_gpu_scheduler_mode::host || g_cfg.video.strict_rendering_mode;
rsx_log.notice("Asynchronous task scheduler is active running in %s mode", m_use_host_scheduler? "'Host'" : "'Device'");
}
void AsyncTaskScheduler::delayed_init()
{
init_config_options();
auto pdev = get_current_renderer();
m_command_pool.create(*const_cast<render_device*>(pdev), pdev->get_transfer_queue_family());
for (usz i = 0; i < events_pool_size; ++i)
{
auto ev1 = std::make_unique<event>(*get_current_renderer(), sync_domain::gpu);
auto ev2 = std::make_unique<event>(*get_current_renderer(), sync_domain::gpu);
m_events_pool.emplace_back(ev1, ev2, 0ull, i);
}
for (usz i = 0; i < VK_MAX_ASYNC_COMPUTE_QUEUES; ++i)
{
m_barriers_pool.emplace_back(0ull, 0xFFFF0000 + i);
}
}
void AsyncTaskScheduler::insert_sync_event()
{
ensure(m_current_cb);
ensure(m_next_event_id < events_pool_size);
auto sync_label = &m_events_pool[m_next_event_id];
if (++m_next_event_id == events_pool_size)
{
// Wrap
m_next_event_id = 0;
}
ensure(sync_label->completion_eid <= vk::last_completed_event_id());
m_sync_label_debug_uid = sync_label->uid;
sync_label->queue1_signal->reset();
sync_label->queue2_signal->reset();
sync_label->completion_eid = vk::current_event_id();
sync_label->queue1_signal->signal(*m_current_cb, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, 0);
if (m_use_host_scheduler)
{
m_event_queue.push(sync_label);
m_sync_label = sync_label->queue2_signal.get();
}
else
{
m_sync_label = sync_label->queue1_signal.get();
}
}
AsyncTaskScheduler::~AsyncTaskScheduler()
{
if (!m_async_command_queue.empty())
{
// Driver resources should be destroyed before driver is detached or you get crashes. RAII won't save you here.
rsx_log.error("Async task scheduler resources were not freed correctly!");
}
}
command_buffer* AsyncTaskScheduler::get_current()
{
std::lock_guard lock(m_submit_mutex);
m_sync_required = true;
// 0. Anything still active?
if (m_current_cb)
{
return m_current_cb;
}
// 1. Check if there is a 'next' entry
if (m_async_command_queue.empty())
{
delayed_init();
}
else if (m_next_cb_index < m_async_command_queue.size())
{
m_current_cb = &m_async_command_queue[m_next_cb_index];
}
// 2. Create entry
if (!m_current_cb)
{
if (m_next_cb_index == VK_MAX_ASYNC_COMPUTE_QUEUES)
{
m_next_cb_index = 0;
m_current_cb = &m_async_command_queue[m_next_cb_index];
}
else
{
m_async_command_queue.emplace_back();
m_current_cb = &m_async_command_queue.back();
m_current_cb->create(m_command_pool, true);
}
}
// 3. Insert a barrier for this CB. A job is about to be scheduled on it immediately.
auto barrier = &m_barriers_pool[m_next_cb_index];
barrier->completion_eid = m_submit_count;
m_event_queue.push(barrier);
m_next_cb_index++;
return m_current_cb;
}
event* AsyncTaskScheduler::get_primary_sync_label()
{
if (m_sync_required) [[unlikely]]
{
std::lock_guard lock(m_submit_mutex); // For some reason this is inexplicably expensive. WTF!
ensure(m_current_cb);
insert_sync_event();
m_sync_required = false;
}
return std::exchange(m_sync_label, nullptr);
}
u64 AsyncTaskScheduler::get_primary_sync_label_debug_uid()
{
return std::exchange(m_sync_label_debug_uid, ~0ull);
}
void AsyncTaskScheduler::flush(VkBool32 force_flush, VkSemaphore wait_semaphore, VkPipelineStageFlags wait_dst_stage_mask)
{
if (!m_current_cb)
{
return;
}
std::lock_guard lock(m_submit_mutex);
if (m_sync_required)
{
insert_sync_event();
}
m_current_cb->end();
m_current_cb->submit(get_current_renderer()->get_transfer_queue(), wait_semaphore, VK_NULL_HANDLE, nullptr, wait_dst_stage_mask, force_flush);
m_submit_count++;
thread_ctrl::notify(g_fxo->get<async_scheduler_thread>());
m_last_used_cb = m_current_cb;
m_current_cb = nullptr;
m_sync_required = false;
}
void AsyncTaskScheduler::kill()
{
g_fxo->get<async_scheduler_thread>() = thread_state::aborting;
while (has_refs());
for (auto& cb : m_async_command_queue)
{
cb.destroy();
}
m_async_command_queue.clear();
m_next_cb_index = 0;
m_command_pool.destroy();
m_events_pool.clear();
}
}