rpcs3/rpcs3/Emu/RSX/Overlays/overlay_perf_metrics.cpp
2019-11-15 14:53:18 +01:00

640 lines
16 KiB
C++

#include "stdafx.h"
#include "overlay_perf_metrics.h"
#include "../GSRender.h"
#include "Emu/Cell/SPUThread.h"
#include "Emu/Cell/RawSPUThread.h"
#include "Emu/Cell/PPUThread.h"
#include "Utilities/sysinfo.h"
#include <algorithm>
#include <utility>
namespace rsx
{
namespace overlays
{
inline color4f convert_color_code(std::string hex_color, f32 opacity = 1.0f)
{
if (hex_color.length() > 0 && hex_color[0] == '#')
{
hex_color.erase(0, 1);
}
unsigned long hexval;
const size_t len = hex_color.length();
try
{
if (len != 6 && len != 8)
{
fmt::throw_exception("wrong length: %d", len);
}
hexval = std::stoul(hex_color, nullptr, 16);
}
catch (const std::exception& e)
{
LOG_ERROR(RSX, "Overlays: tried to convert incompatible color code: '%s' exception: '%s'", hex_color, e.what());
return color4f(0.0f, 0.0f, 0.0f, 0.0f);
}
const int r = (len == 8 ? (hexval >> 24) : (hexval >> 16)) & 0xff;
const int g = (len == 8 ? (hexval >> 16) : (hexval >> 8)) & 0xff;
const int b = (len == 8 ? (hexval >> 8) : (hexval >> 0)) & 0xff;
const int a = len == 8 ? ((hexval >> 0) & 0xff) : 255;
return color4f(r / 255.f, g / 255.f, b / 255.f, a / 255.f * opacity);
}
void perf_metrics_overlay::reset_transform(label& elm, u16 bottom_margin) const
{
const u32 text_padding = m_font_size / 2;
// left, top, right, bottom
const areau padding { text_padding, text_padding - 4, text_padding, text_padding };
const positionu margin { m_margin_x, m_margin_y };
positionu pos;
const auto overlay_width = m_body.w + margin.x;
const auto overlay_height = m_body.h + margin.y;
switch (m_quadrant)
{
case screen_quadrant::top_left:
pos.x = margin.x;
pos.y = margin.y;
break;
case screen_quadrant::top_right:
pos.x = virtual_width - overlay_width;
pos.y = margin.y;
break;
case screen_quadrant::bottom_left:
pos.x = margin.x;
pos.y = virtual_height - overlay_height - bottom_margin;
break;
case screen_quadrant::bottom_right:
pos.x = virtual_width - overlay_width;
pos.y = virtual_height - overlay_height - bottom_margin;
break;
}
if (g_cfg.video.perf_overlay.center_x)
{
pos.x = (virtual_width - m_body.w) / 2;
}
if (g_cfg.video.perf_overlay.center_y)
{
pos.y = (virtual_height - m_body.h - bottom_margin) / 2;
}
elm.set_pos(pos.x, pos.y);
elm.set_padding(padding.x1, padding.x2, padding.y1, padding.y2);
}
void perf_metrics_overlay::reset_transforms()
{
const u16 perf_overlay_padding = m_font_size / 2;
const u16 graphs_padding = m_font_size * 2;
const u16 fps_graph_h = 60;
const u16 frametime_graph_h = 45;
u16 bottom_margin{};
if (m_framerate_graph_enabled || m_frametime_graph_enabled)
{
// Adjust body size to account for the graphs
// TODO: Bit hacky, could do this with margins if overlay_element had bottom margin (or negative top at least)
bottom_margin = perf_overlay_padding;
if (m_framerate_graph_enabled)
{
bottom_margin += fps_graph_h;
if (m_frametime_graph_enabled)
{
bottom_margin += graphs_padding;
}
}
if (m_frametime_graph_enabled)
{
bottom_margin += frametime_graph_h;
}
}
// Set body/titles transform
reset_transform(m_body, bottom_margin);
reset_transform(m_titles, bottom_margin);
if (m_framerate_graph_enabled || m_frametime_graph_enabled)
{
// Position the graphs within the body
const u16 graphs_width = m_body.w;
const u16 body_left = m_body.x;
const u16 body_bottom = m_body.y + m_body.h + perf_overlay_padding;
if (m_framerate_graph_enabled)
{
m_fps_graph.set_pos(body_left, body_bottom);
m_fps_graph.set_size(graphs_width, fps_graph_h);
}
if (m_frametime_graph_enabled)
{
u16 padding = 0;
if (m_framerate_graph_enabled)
{
padding = m_fps_graph.h + graphs_padding;
}
m_frametime_graph.set_pos(body_left, body_bottom + padding);
m_frametime_graph.set_size(graphs_width, frametime_graph_h);
}
}
}
void perf_metrics_overlay::reset_body()
{
m_body.set_font(m_font.c_str(), m_font_size);
m_body.fore_color = convert_color_code(g_cfg.video.perf_overlay.color_body, m_opacity);
m_body.back_color = convert_color_code(g_cfg.video.perf_overlay.background_body, m_opacity);
reset_transform(m_body);
}
void perf_metrics_overlay::reset_titles()
{
m_titles.set_font(m_font.c_str(), m_font_size);
m_titles.fore_color = convert_color_code(g_cfg.video.perf_overlay.color_title, m_opacity);
m_titles.back_color = convert_color_code(g_cfg.video.perf_overlay.background_title, m_opacity);
reset_transform(m_titles);
switch (m_detail)
{
case detail_level::minimal:
case detail_level::low: m_titles.text = ""; break;
case detail_level::medium: m_titles.text = fmt::format("\n\n%s", title1_medium); break;
case detail_level::high: m_titles.text = fmt::format("\n\n%s\n\n\n\n\n\n%s", title1_high, title2); break;
}
m_titles.auto_resize();
m_titles.refresh();
}
void perf_metrics_overlay::reset_text()
{
reset_body();
reset_titles();
}
void perf_metrics_overlay::init()
{
reset_text();
force_next_update();
m_update_timer.Start();
m_frametime_timer.Start();
update();
m_is_initialised = true;
}
void perf_metrics_overlay::set_framerate_graph_enabled(bool enabled)
{
m_framerate_graph_enabled = enabled;
if (enabled)
{
m_fps_graph.set_title("Framerate");
m_fps_graph.set_font_size(m_font_size * 0.8);
m_fps_graph.set_count(50);
m_fps_graph.set_color(convert_color_code(g_cfg.video.perf_overlay.color_body));
m_fps_graph.set_guide_interval(10);
}
if (m_is_initialised)
{
reset_transforms();
}
}
void perf_metrics_overlay::set_frametime_graph_enabled(bool enabled)
{
m_frametime_graph_enabled = enabled;
if (enabled)
{
m_frametime_graph.set_title("Frametime");
m_frametime_graph.set_font_size(m_font_size * 0.8);
m_frametime_graph.set_count(170);
m_frametime_graph.set_color(convert_color_code(g_cfg.video.perf_overlay.color_body));
m_frametime_graph.set_guide_interval(8);
}
if (m_is_initialised)
{
reset_transforms();
}
}
void perf_metrics_overlay::set_detail_level(detail_level level)
{
m_detail = level;
if (m_is_initialised)
{
reset_titles();
}
}
void perf_metrics_overlay::set_position(screen_quadrant quadrant)
{
m_quadrant = quadrant;
if (m_is_initialised)
{
reset_transforms();
}
}
// In ms
void perf_metrics_overlay::set_update_interval(u32 update_interval)
{
m_update_interval = update_interval;
}
void perf_metrics_overlay::set_font(std::string font)
{
m_font = std::move(font);
if (m_is_initialised)
{
reset_text();
}
}
void perf_metrics_overlay::set_font_size(u32 font_size)
{
m_font_size = font_size;
if (m_is_initialised)
{
reset_text();
}
}
void perf_metrics_overlay::set_margins(u32 margin_x, u32 margin_y)
{
m_margin_x = margin_x;
m_margin_y = margin_y;
if (m_is_initialised)
{
reset_transforms();
}
}
void perf_metrics_overlay::set_opacity(f32 opacity)
{
m_opacity = opacity;
if (m_is_initialised)
{
reset_text();
}
}
void perf_metrics_overlay::force_next_update()
{
m_force_update = true;
}
void perf_metrics_overlay::update()
{
const auto elapsed_update = m_update_timer.GetElapsedTimeInMilliSec();
if (m_is_initialised && m_frametime_graph_enabled)
{
const auto elapsed_frame = m_frametime_timer.GetElapsedTimeInMilliSec();
m_frametime_graph.record_datapoint(elapsed_frame);
}
if (!m_force_update)
{
++m_frames;
}
if (elapsed_update >= m_update_interval || m_force_update)
{
if (!m_force_update)
{
m_update_timer.Start();
}
f32 fps{0};
f32 frametime{0};
u64 ppu_cycles{0};
u64 spu_cycles{0};
u64 rsx_cycles{0};
u64 total_cycles{0};
u32 ppus{0};
u32 spus{0};
f32 cpu_usage{-1.f};
u32 total_threads{0};
f32 ppu_usage{0};
f32 spu_usage{0};
f32 rsx_usage{0};
u32 rsx_load{0};
const auto rsx_thread = g_fxo->get<rsx::thread>();
std::string perf_text;
// 1. Fetch/calculate metrics we'll need
switch (m_detail)
{
case detail_level::high:
{
frametime = m_force_update ? 0 : std::max(0.0, elapsed_update / m_frames);
rsx_load = rsx_thread->get_load();
total_threads = CPUStats::get_thread_count();
// fallthrough
}
case detail_level::medium:
{
ppus = idm::select<named_thread<ppu_thread>>([&ppu_cycles](u32, named_thread<ppu_thread>& ppu)
{
ppu_cycles += thread_ctrl::get_cycles(ppu);
});
spus = idm::select<named_thread<spu_thread>>([&spu_cycles](u32, named_thread<spu_thread>& spu)
{
spu_cycles += thread_ctrl::get_cycles(spu);
});
rsx_cycles += rsx_thread->get_cycles();
total_cycles = ppu_cycles + spu_cycles + rsx_cycles;
cpu_usage = m_cpu_stats.get_usage();
ppu_usage = std::clamp(cpu_usage * ppu_cycles / total_cycles, 0.f, 100.f);
spu_usage = std::clamp(cpu_usage * spu_cycles / total_cycles, 0.f, 100.f);
rsx_usage = std::clamp(cpu_usage * rsx_cycles / total_cycles, 0.f, 100.f);
// fallthrough
}
case detail_level::low:
{
if (cpu_usage < 0.)
cpu_usage = m_cpu_stats.get_usage();
// fallthrough
}
case detail_level::minimal:
{
fps = m_force_update ? 0 : std::max(0.0, static_cast<f32>(m_frames) / (elapsed_update / 1000));
if (m_is_initialised && m_framerate_graph_enabled)
m_fps_graph.record_datapoint(fps);
}
}
// 2. Format output string
switch (m_detail)
{
case detail_level::minimal:
{
perf_text += fmt::format("FPS : %05.2f", fps);
break;
}
case detail_level::low:
{
perf_text += fmt::format("FPS : %05.2f\n"
"CPU : %04.1f %%",
fps, cpu_usage);
break;
}
case detail_level::medium:
{
perf_text += fmt::format("FPS : %05.2f\n\n"
"%s\n"
" PPU : %04.1f %%\n"
" SPU : %04.1f %%\n"
" RSX : %04.1f %%\n"
" Total : %04.1f %%",
fps, std::string(title1_medium.size(), ' '), ppu_usage, spu_usage, rsx_usage, cpu_usage, std::string(title2.size(), ' '));
break;
}
case detail_level::high:
{
perf_text += fmt::format("FPS : %05.2f (%03.1fms)\n\n"
"%s\n"
" PPU : %04.1f %% (%2u)\n"
" SPU : %04.1f %% (%2u)\n"
" RSX : %04.1f %% ( 1)\n"
" Total : %04.1f %% (%2u)\n\n"
"%s\n"
" RSX : %02u %%",
fps, frametime, std::string(title1_high.size(), ' '), ppu_usage, ppus, spu_usage, spus, rsx_usage, cpu_usage, total_threads, std::string(title2.size(), ' '), rsx_load);
break;
}
}
m_body.text = perf_text;
if (m_body.auto_resize())
{
reset_transforms();
}
m_body.refresh();
if (!m_force_update)
{
m_frames = 0;
}
else
{
// Only force once
m_force_update = false;
}
}
if (m_framerate_graph_enabled)
{
m_fps_graph.update();
}
if (m_frametime_graph_enabled)
{
m_frametime_graph.update();
m_frametime_timer.Start();
}
}
compiled_resource perf_metrics_overlay::get_compiled()
{
auto compiled_resources = m_body.get_compiled();
compiled_resources.add(m_titles.get_compiled());
if (m_framerate_graph_enabled)
{
compiled_resources.add(m_fps_graph.get_compiled());
}
if (m_frametime_graph_enabled)
{
compiled_resources.add(m_frametime_graph.get_compiled());
}
return compiled_resources;
}
graph::graph()
{
m_label.set_font("e046323ms.ttf", 8);
m_label.fore_color = { 1.f, 1.f, 1.f, 1.f };
m_label.back_color = { 0.f, 0.f, 0.f, .7f };
back_color = { 0.f, 0.f, 0.f, 0.5f };
}
void graph::set_pos(u16 _x, u16 _y)
{
overlay_element::set_pos(_x, _y);
m_label.set_pos(x, y + h);
}
void graph::set_size(u16 _w, u16 _h)
{
overlay_element::set_size(_w, _h);
set_padding(0, 0, h, 0);
m_label.set_size(w, m_label.h);
m_label.set_pos(x, y + h);
}
void graph::set_title(const char* title)
{
m_title = title;
}
void graph::set_font(const char* font_name, u16 font_size)
{
m_label.set_font(font_name, font_size);
}
void graph::set_font_size(u16 font_size)
{
const auto font_name = m_label.get_font()->font_name.c_str();
m_label.set_font(font_name, font_size);
}
void graph::set_count(u32 datapoint_count)
{
m_datapoint_count = datapoint_count;
m_datapoints.resize(datapoint_count, 0);
}
void graph::set_color(color4f color)
{
m_color = color;
}
void graph::set_guide_interval(f32 guide_interval)
{
m_guide_interval = guide_interval;
}
void graph::record_datapoint(f32 datapoint)
{
// std::dequeue is only faster for large sizes, so just use a std::vector and resize once in while
// Record datapoint
m_datapoints.push_back(datapoint);
// Calculate new min/max
// Make sure min/max reflects the data being displayed, not the entire datapoints vector
m_min = *std::min_element(m_datapoints.end() - m_datapoint_count, m_datapoints.end());
m_max = *std::max_element(m_datapoints.end() - m_datapoint_count, m_datapoints.end());
// Cull vector when it gets large
if (m_datapoints.size() > m_datapoint_count * 16ull)
{
std::copy(m_datapoints.begin() + m_datapoints.size() - m_datapoint_count, m_datapoints.end(), m_datapoints.begin());
m_datapoints.resize(m_datapoint_count);
}
}
void graph::update()
{
m_label.set_text(fmt::format("%s min:%5.2f max:%6.2f", m_title.c_str(), m_min, m_max));
m_label.set_padding(4, 4, 0, 4);
m_label.auto_resize();
m_label.refresh();
}
compiled_resource& graph::get_compiled()
{
refresh();
overlay_element::get_compiled();
const f32 normalize_factor = f32(h) / m_max;
// Don't show guide lines if they'd be more dense than 1 guide line every 3 pixels
const bool guides_too_dense = (m_max / m_guide_interval) > (h / 3);
if (m_guide_interval > 0 && !guides_too_dense)
{
auto& cmd_guides = compiled_resources.append({});
auto& config_guides = cmd_guides.config;
config_guides.color = { 1.f, 1.f, 1.f, .2f };
config_guides.primitives = primitive_type::line_list;
auto& verts_guides = compiled_resources.draw_commands.back().verts;
for (auto y_off = m_guide_interval; y_off < m_max; y_off += m_guide_interval)
{
const f32 guide_y = y + y_off * normalize_factor;
verts_guides.emplace_back(x, guide_y);
verts_guides.emplace_back(x + w, guide_y);
}
}
auto& cmd_graph = compiled_resources.append({});
auto& config_graph = cmd_graph.config;
config_graph.color = m_color;
config_graph.primitives = primitive_type::line_strip;
auto& verts_graph = compiled_resources.draw_commands.back().verts;
const f32 x_stride = f32(w) / m_datapoint_count;
const u32 tail_index_offset = m_datapoints.size() - m_datapoint_count;
for (u32 i = 0; i < m_datapoint_count; ++i)
{
const f32 x_line = x + i * x_stride;
const f32 y_line = y + h - (m_datapoints[i + tail_index_offset] * normalize_factor);
verts_graph.emplace_back(x_line, y_line);
}
compiled_resources.add(m_label.get_compiled());
return compiled_resources;
}
} // namespace overlays
} // namespace rsx