368 lines
11 KiB
C
368 lines
11 KiB
C
/*
|
|
* ***** BEGIN GPL LICENSE BLOCK *****
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version 2
|
|
* of the License, or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
*
|
|
* Copyright 2016, Blender Foundation.
|
|
* Contributor(s): Blender Institute
|
|
*
|
|
* ***** END GPL LICENSE BLOCK *****
|
|
*
|
|
*/
|
|
|
|
/** \file draw_manager_profiling.c
|
|
* \ingroup draw
|
|
*/
|
|
|
|
#include "BLI_rect.h"
|
|
#include "BLI_string.h"
|
|
|
|
#include "BKE_global.h"
|
|
|
|
#include "BLF_api.h"
|
|
|
|
#include "MEM_guardedalloc.h"
|
|
|
|
#include "draw_manager.h"
|
|
|
|
#include "GPU_glew.h"
|
|
#include "GPU_texture.h"
|
|
|
|
#include "UI_resources.h"
|
|
|
|
#include "WM_api.h"
|
|
#include "WM_types.h"
|
|
|
|
#include "draw_manager_profiling.h"
|
|
|
|
#define MAX_TIMER_NAME 32
|
|
#define MAX_NESTED_TIMER 8
|
|
#define CHUNK_SIZE 8
|
|
#define GPU_TIMER_FALLOFF 0.1
|
|
|
|
typedef struct DRWTimer {
|
|
GLuint query[2];
|
|
GLuint64 time_average;
|
|
char name[MAX_TIMER_NAME];
|
|
int lvl; /* Hierarchy level for nested timer. */
|
|
bool is_query; /* Does this timer actually perform queries or is it just a group. */
|
|
} DRWTimer;
|
|
|
|
static struct DRWTimerPool {
|
|
DRWTimer *timers;
|
|
int chunk_count; /* Number of chunk allocated. */
|
|
int timer_count; /* chunk_count * CHUNK_SIZE */
|
|
int timer_increment; /* Keep track of where we are in the stack. */
|
|
int end_increment; /* Keep track of bad usage. */
|
|
bool is_recording; /* Are we in the render loop? */
|
|
bool is_querying; /* Keep track of bad usage. */
|
|
} DTP = {NULL};
|
|
|
|
void DRW_stats_free(void)
|
|
{
|
|
if (DTP.timers != NULL) {
|
|
for (int i = 0; i < DTP.timer_count; ++i) {
|
|
DRWTimer *timer = &DTP.timers[i];
|
|
glDeleteQueries(2, timer->query);
|
|
}
|
|
MEM_freeN(DTP.timers);
|
|
DTP.timers = NULL;
|
|
}
|
|
}
|
|
|
|
void DRW_stats_begin(void)
|
|
{
|
|
if (G.debug_value > 20 && G.debug_value < 30) {
|
|
DTP.is_recording = true;
|
|
}
|
|
|
|
if (DTP.is_recording && DTP.timers == NULL) {
|
|
DTP.chunk_count = 1;
|
|
DTP.timer_count = DTP.chunk_count * CHUNK_SIZE;
|
|
DTP.timers = MEM_callocN(sizeof(DRWTimer) * DTP.timer_count, "DRWTimer stack");
|
|
}
|
|
else if (!DTP.is_recording && DTP.timers != NULL) {
|
|
DRW_stats_free();
|
|
}
|
|
|
|
DTP.is_querying = false;
|
|
DTP.timer_increment = 0;
|
|
DTP.end_increment = 0;
|
|
}
|
|
|
|
static DRWTimer *drw_stats_timer_get(void)
|
|
{
|
|
if (UNLIKELY(DTP.timer_increment >= DTP.timer_count)) {
|
|
/* Resize the stack. */
|
|
DTP.chunk_count++;
|
|
DTP.timer_count = DTP.chunk_count * CHUNK_SIZE;
|
|
DTP.timers = MEM_recallocN(DTP.timers, sizeof(DRWTimer) * DTP.timer_count);
|
|
}
|
|
|
|
return &DTP.timers[DTP.timer_increment++];
|
|
}
|
|
|
|
static void drw_stats_timer_start_ex(const char *name, const bool is_query)
|
|
{
|
|
if (DTP.is_recording) {
|
|
DRWTimer *timer = drw_stats_timer_get();
|
|
BLI_strncpy(timer->name, name, MAX_TIMER_NAME);
|
|
timer->lvl = DTP.timer_increment - DTP.end_increment - 1;
|
|
timer->is_query = is_query;
|
|
|
|
/* Queries cannot be nested or interleaved. */
|
|
BLI_assert(!DTP.is_querying);
|
|
if (timer->is_query) {
|
|
if (timer->query[0] == 0) {
|
|
glGenQueries(1, timer->query);
|
|
}
|
|
|
|
glFinish();
|
|
/* Issue query for the next frame */
|
|
glBeginQuery(GL_TIME_ELAPSED, timer->query[0]);
|
|
DTP.is_querying = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Use this to group the queries. It does NOT keep track
|
|
* of the time, it only sum what the queries inside it. */
|
|
void DRW_stats_group_start(const char *name)
|
|
{
|
|
drw_stats_timer_start_ex(name, false);
|
|
}
|
|
|
|
void DRW_stats_group_end(void)
|
|
{
|
|
if (DTP.is_recording) {
|
|
BLI_assert(!DTP.is_querying);
|
|
DTP.end_increment++;
|
|
}
|
|
}
|
|
|
|
/* NOTE: Only call this when no sub timer will be called. */
|
|
void DRW_stats_query_start(const char *name)
|
|
{
|
|
drw_stats_timer_start_ex(name, true);
|
|
}
|
|
|
|
void DRW_stats_query_end(void)
|
|
{
|
|
if (DTP.is_recording) {
|
|
DTP.end_increment++;
|
|
BLI_assert(DTP.is_querying);
|
|
glEndQuery(GL_TIME_ELAPSED);
|
|
DTP.is_querying = false;
|
|
}
|
|
}
|
|
|
|
void DRW_stats_reset(void)
|
|
{
|
|
BLI_assert((DTP.timer_increment - DTP.end_increment) <= 0 && "You forgot a DRW_stats_group/query_end somewhere!");
|
|
BLI_assert((DTP.timer_increment - DTP.end_increment) >= 0 && "You forgot a DRW_stats_group/query_start somewhere!");
|
|
|
|
if (DTP.is_recording) {
|
|
GLuint64 lvl_time[MAX_NESTED_TIMER] = {0};
|
|
|
|
/* Swap queries for the next frame and sum up each lvl time. */
|
|
for (int i = DTP.timer_increment - 1; i >= 0; --i) {
|
|
DRWTimer *timer = &DTP.timers[i];
|
|
SWAP(GLuint, timer->query[0], timer->query[1]);
|
|
|
|
BLI_assert(timer->lvl < MAX_NESTED_TIMER);
|
|
|
|
if (timer->is_query) {
|
|
GLuint64 time;
|
|
if (timer->query[0] != 0) {
|
|
glGetQueryObjectui64v(timer->query[0], GL_QUERY_RESULT, &time);
|
|
}
|
|
else {
|
|
time = 1000000000; /* 1ms default */
|
|
}
|
|
|
|
timer->time_average = timer->time_average * (1.0 - GPU_TIMER_FALLOFF) + time * GPU_TIMER_FALLOFF;
|
|
timer->time_average = MIN2(timer->time_average, 1000000000);
|
|
}
|
|
else {
|
|
timer->time_average = lvl_time[timer->lvl + 1];
|
|
lvl_time[timer->lvl + 1] = 0;
|
|
}
|
|
|
|
lvl_time[timer->lvl] += timer->time_average;
|
|
}
|
|
|
|
DTP.is_recording = false;
|
|
}
|
|
}
|
|
|
|
static void draw_stat_5row(rcti *rect, int u, int v, const char *txt, const int size)
|
|
{
|
|
BLF_draw_default_ascii(rect->xmin + (1 + u * 5) * U.widget_unit,
|
|
rect->ymax - (3 + v) * U.widget_unit, 0.0f,
|
|
txt, size);
|
|
}
|
|
|
|
static void draw_stat(rcti *rect, int u, int v, const char *txt, const int size)
|
|
{
|
|
BLF_draw_default_ascii(rect->xmin + (1 + u) * U.widget_unit,
|
|
rect->ymax - (3 + v) * U.widget_unit, 0.0f,
|
|
txt, size);
|
|
}
|
|
|
|
void DRW_stats_draw(rcti *rect)
|
|
{
|
|
char stat_string[64];
|
|
int lvl_index[MAX_NESTED_TIMER];
|
|
int v = 0, u = 0;
|
|
|
|
double init_tot_time = 0.0, background_tot_time = 0.0, render_tot_time = 0.0, tot_time = 0.0;
|
|
|
|
int fontid = BLF_default();
|
|
UI_FontThemeColor(fontid, TH_TEXT_HI);
|
|
BLF_enable(fontid, BLF_SHADOW);
|
|
BLF_shadow(fontid, 5, (const float[4]){0.0f, 0.0f, 0.0f, 0.75f});
|
|
BLF_shadow_offset(fontid, 0, -1);
|
|
|
|
BLF_batch_draw_begin();
|
|
|
|
/* ------------------------------------------ */
|
|
/* ---------------- CPU stats --------------- */
|
|
/* ------------------------------------------ */
|
|
/* Label row */
|
|
char col_label[32];
|
|
sprintf(col_label, "Engine");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(col_label, "Init");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(col_label, "Background");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(col_label, "Render");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(col_label, "Total (w/o cache)");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
v++;
|
|
|
|
/* Engines rows */
|
|
char time_to_txt[16];
|
|
for (LinkData *link = DST.enabled_engines.first; link; link = link->next) {
|
|
u = 0;
|
|
DrawEngineType *engine = link->data;
|
|
ViewportEngineData *data = drw_viewport_engine_data_ensure(engine);
|
|
|
|
draw_stat_5row(rect, u++, v, engine->idname, sizeof(engine->idname));
|
|
|
|
init_tot_time += data->init_time;
|
|
sprintf(time_to_txt, "%.2fms", data->init_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
|
|
background_tot_time += data->background_time;
|
|
sprintf(time_to_txt, "%.2fms", data->background_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
|
|
render_tot_time += data->render_time;
|
|
sprintf(time_to_txt, "%.2fms", data->render_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
|
|
tot_time += data->init_time + data->background_time + data->render_time;
|
|
sprintf(time_to_txt, "%.2fms", data->init_time + data->background_time + data->render_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
v++;
|
|
}
|
|
|
|
/* Totals row */
|
|
u = 0;
|
|
sprintf(col_label, "Sub Total");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(time_to_txt, "%.2fms", init_tot_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
sprintf(time_to_txt, "%.2fms", background_tot_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
sprintf(time_to_txt, "%.2fms", render_tot_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
sprintf(time_to_txt, "%.2fms", tot_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
v += 2;
|
|
|
|
u = 0;
|
|
double *cache_time = GPU_viewport_cache_time_get(DST.viewport);
|
|
sprintf(col_label, "Cache Time");
|
|
draw_stat_5row(rect, u++, v, col_label, sizeof(col_label));
|
|
sprintf(time_to_txt, "%.2fms", *cache_time);
|
|
draw_stat_5row(rect, u++, v, time_to_txt, sizeof(time_to_txt));
|
|
v += 2;
|
|
|
|
/* ------------------------------------------ */
|
|
/* ---------------- GPU stats --------------- */
|
|
/* ------------------------------------------ */
|
|
|
|
/* Memory Stats */
|
|
uint tex_mem = GPU_texture_memory_usage_get();
|
|
uint vbo_mem = GPU_vertbuf_get_memory_usage();
|
|
|
|
sprintf(stat_string, "GPU Memory");
|
|
draw_stat(rect, 0, v, stat_string, sizeof(stat_string));
|
|
sprintf(stat_string, "%.2fMB", (double)(tex_mem + vbo_mem) / 1000000.0);
|
|
draw_stat_5row(rect, 1, v++, stat_string, sizeof(stat_string));
|
|
sprintf(stat_string, "Textures");
|
|
draw_stat(rect, 1, v, stat_string, sizeof(stat_string));
|
|
sprintf(stat_string, "%.2fMB", (double)tex_mem / 1000000.0);
|
|
draw_stat_5row(rect, 1, v++, stat_string, sizeof(stat_string));
|
|
sprintf(stat_string, "Meshes");
|
|
draw_stat(rect, 1, v, stat_string, sizeof(stat_string));
|
|
sprintf(stat_string, "%.2fMB", (double)vbo_mem / 1000000.0);
|
|
draw_stat_5row(rect, 1, v++, stat_string, sizeof(stat_string));
|
|
v += 1;
|
|
|
|
/* GPU Timings */
|
|
BLI_snprintf(stat_string, sizeof(stat_string), "GPU Render Timings");
|
|
draw_stat(rect, 0, v++, stat_string, sizeof(stat_string));
|
|
|
|
for (int i = 0; i < DTP.timer_increment; ++i) {
|
|
double time_ms, time_percent;
|
|
DRWTimer *timer = &DTP.timers[i];
|
|
DRWTimer *timer_parent = (timer->lvl > 0) ? &DTP.timers[lvl_index[timer->lvl - 1]] : NULL;
|
|
|
|
/* Only display a number of lvl at a time */
|
|
if ((G.debug_value - 21) < timer->lvl) continue;
|
|
|
|
BLI_assert(timer->lvl < MAX_NESTED_TIMER);
|
|
lvl_index[timer->lvl] = i;
|
|
|
|
time_ms = timer->time_average / 1000000.0;
|
|
|
|
if (timer_parent != NULL) {
|
|
time_percent = ((double)timer->time_average / (double)timer_parent->time_average) * 100.0;
|
|
}
|
|
else {
|
|
time_percent = 100.0;
|
|
}
|
|
|
|
/* avoid very long number */
|
|
time_ms = MIN2(time_ms, 999.0);
|
|
time_percent = MIN2(time_percent, 100.0);
|
|
|
|
BLI_snprintf(stat_string, sizeof(stat_string), "%s", timer->name);
|
|
draw_stat(rect, 0 + timer->lvl, v, stat_string, sizeof(stat_string));
|
|
BLI_snprintf(stat_string, sizeof(stat_string), "%.2fms", time_ms);
|
|
draw_stat(rect, 12 + timer->lvl, v, stat_string, sizeof(stat_string));
|
|
BLI_snprintf(stat_string, sizeof(stat_string), "%.0f", time_percent);
|
|
draw_stat(rect, 16 + timer->lvl, v, stat_string, sizeof(stat_string));
|
|
v++;
|
|
}
|
|
|
|
BLF_batch_draw_end();
|
|
BLF_disable(fontid, BLF_SHADOW);
|
|
}
|