2015-05-24 06:55:12 +02:00
|
|
|
// Copyright 2012 Dolphin Emulator Project
|
2021-07-05 03:22:19 +02:00
|
|
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
2013-12-30 07:22:50 -06:00
|
|
|
|
2020-09-15 05:00:24 -07:00
|
|
|
#include "VideoBackends/OGL/OGLPerfQuery.h"
|
2019-07-16 20:18:48 -04:00
|
|
|
|
2015-12-20 21:49:49 -05:00
|
|
|
#include <memory>
|
|
|
|
|
2016-01-17 16:54:31 -05:00
|
|
|
#include "Common/CommonTypes.h"
|
2018-10-03 23:03:26 +10:00
|
|
|
#include "Common/GL/GLExtensions/GLExtensions.h"
|
2015-09-19 04:40:00 +12:00
|
|
|
|
2023-01-27 13:21:09 +13:00
|
|
|
#include "VideoBackends/OGL/OGLGfx.h"
|
2023-01-31 17:26:46 +13:00
|
|
|
#include "VideoCommon/FramebufferManager.h"
|
2019-07-16 20:18:48 -04:00
|
|
|
#include "VideoCommon/VideoCommon.h"
|
2016-06-13 15:41:29 +10:00
|
|
|
#include "VideoCommon/VideoConfig.h"
|
2012-06-17 13:58:29 +02:00
|
|
|
|
2013-02-16 17:50:40 -06:00
|
|
|
namespace OGL
|
|
|
|
{
|
2023-01-28 14:53:19 +13:00
|
|
|
std::unique_ptr<PerfQueryBase> GetPerfQuery(bool is_gles)
|
2015-02-21 16:58:53 -06:00
|
|
|
{
|
2018-10-03 23:03:26 +10:00
|
|
|
if (is_gles && GLExtensions::Supports("GL_NV_occlusion_query_samples"))
|
2015-12-20 21:49:49 -05:00
|
|
|
return std::make_unique<PerfQueryGLESNV>();
|
2018-10-03 23:03:26 +10:00
|
|
|
else if (is_gles)
|
2015-12-20 21:49:49 -05:00
|
|
|
return std::make_unique<PerfQueryGL>(GL_ANY_SAMPLES_PASSED);
|
2018-10-03 23:03:26 +10:00
|
|
|
else
|
|
|
|
return std::make_unique<PerfQueryGL>(GL_SAMPLES_PASSED);
|
2015-02-21 16:58:53 -06:00
|
|
|
}
|
2012-06-17 13:58:29 +02:00
|
|
|
|
|
|
|
PerfQuery::PerfQuery() : m_query_read_pos()
|
2015-02-21 16:58:53 -06:00
|
|
|
{
|
|
|
|
ResetQuery();
|
|
|
|
}
|
|
|
|
|
2022-11-17 21:54:43 +01:00
|
|
|
// Forwards the request to the backend implementation held in m_query.
void PerfQuery::EnableQuery(PerfQueryGroup group)
{
  m_query->EnableQuery(group);
}
|
|
|
|
|
2022-11-17 21:54:43 +01:00
|
|
|
// Forwards the request to the backend implementation held in m_query.
void PerfQuery::DisableQuery(PerfQueryGroup group)
{
  m_query->DisableQuery(group);
}
|
|
|
|
|
|
|
|
bool PerfQuery::IsFlushed() const
|
|
|
|
{
|
2021-05-13 19:30:30 +02:00
|
|
|
return m_query_count.load(std::memory_order_relaxed) == 0;
|
2015-02-21 16:58:53 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: could selectively flush things, but I don't think that will do much
|
|
|
|
void PerfQuery::FlushResults()
|
|
|
|
{
|
|
|
|
m_query->FlushResults();
|
|
|
|
}
|
|
|
|
|
|
|
|
void PerfQuery::ResetQuery()
|
|
|
|
{
|
2021-05-13 19:30:30 +02:00
|
|
|
m_query_count.store(0, std::memory_order_relaxed);
|
|
|
|
for (size_t i = 0; i < m_results.size(); ++i)
|
|
|
|
m_results[i].store(0, std::memory_order_relaxed);
|
2015-02-21 16:58:53 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
// Maps a requested counter type onto the accumulated per-group results.
//  - ZCOMPLOC input/output -> PQG_ZCOMP_ZCOMPLOC
//  - ZCOMP input/output    -> PQG_ZCOMP
//  - blend input           -> PQG_ZCOMP + PQG_ZCOMP_ZCOMPLOC
//  - EFB copy clocks       -> PQG_EFB_COPY_CLOCKS
// Any other type yields 0.
u32 PerfQuery::GetQueryResult(PerfQueryType type)
{
  switch (type)
  {
  case PQ_ZCOMP_INPUT_ZCOMPLOC:
  case PQ_ZCOMP_OUTPUT_ZCOMPLOC:
    return m_results[PQG_ZCOMP_ZCOMPLOC].load(std::memory_order_relaxed);

  case PQ_ZCOMP_INPUT:
  case PQ_ZCOMP_OUTPUT:
    return m_results[PQG_ZCOMP].load(std::memory_order_relaxed);

  case PQ_BLEND_INPUT:
  {
    const u32 zcomp = m_results[PQG_ZCOMP].load(std::memory_order_relaxed);
    const u32 zcomp_zcomploc = m_results[PQG_ZCOMP_ZCOMPLOC].load(std::memory_order_relaxed);
    return zcomp + zcomp_zcomploc;
  }

  case PQ_EFB_COPY_CLOCKS:
    return m_results[PQG_EFB_COPY_CLOCKS].load(std::memory_order_relaxed);

  default:
    return 0;
  }
}
|
|
|
|
|
|
|
|
// Implementations
|
|
|
|
// Remembers the GL query target to use and allocates one GL query object for
// every slot of the query buffer.
PerfQueryGL::PerfQueryGL(GLenum query_type) : m_query_type(query_type)
{
  for (ActiveQuery& slot : m_query_buffer)
  {
    glGenQueries(1, &slot.query_id);
  }
}
|
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
// Releases the GL query object owned by every slot of the query buffer.
PerfQueryGL::~PerfQueryGL()
{
  for (ActiveQuery& slot : m_query_buffer)
  {
    glDeleteQueries(1, &slot.query_id);
  }
}
|
|
|
|
|
2022-11-17 21:54:43 +01:00
|
|
|
// Begins a GL query for `group`, using the query buffer as a circular queue
// that starts at m_query_read_pos and holds m_query_count pending entries.
// Buffer maintenance happens for every group; a query is only started for the
// two ZCOMP groups.
void PerfQueryGL::EnableQuery(PerfQueryGroup group)
{
  const auto capacity = m_query_buffer.size();
  u32 pending = m_query_count.load(std::memory_order_relaxed);

  // Is this sane?
  // More than half of the slots are in use: retire whatever is already available.
  if (pending > capacity / 2)
  {
    WeakFlush();
    pending = m_query_count.load(std::memory_order_relaxed);
  }

  // Still completely full: read back the oldest query unconditionally to free a slot.
  if (capacity == pending)
  {
    FlushOne();
    pending = m_query_count.load(std::memory_order_relaxed);
    // ERROR_LOG_FMT(VIDEO, "Flushed query buffer early!");
  }

  // start query
  if (group != PQG_ZCOMP_ZCOMPLOC && group != PQG_ZCOMP)
    return;

  // The first free slot sits right behind the last pending one.
  auto& slot = m_query_buffer[(m_query_read_pos + pending) % capacity];

  glBeginQuery(m_query_type, slot.query_id);
  slot.query_group = group;

  m_query_count.fetch_add(1, std::memory_order_relaxed);
}
|
2022-11-17 21:54:43 +01:00
|
|
|
// Ends the active GL query. Only the two ZCOMP groups ever start one, so every
// other group is ignored.
void PerfQueryGL::DisableQuery(PerfQueryGroup group)
{
  const bool is_zcomp_group = group == PQG_ZCOMP_ZCOMPLOC || group == PQG_ZCOMP;
  if (!is_zcomp_group)
    return;

  // stop query
  glEndQuery(m_query_type);
}
|
2012-06-17 13:58:29 +02:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
void PerfQueryGL::WeakFlush()
|
2013-02-16 17:50:40 -06:00
|
|
|
{
|
2015-02-21 16:58:53 -06:00
|
|
|
while (!IsFlushed())
|
|
|
|
{
|
|
|
|
auto& entry = m_query_buffer[m_query_read_pos];
|
2016-06-24 10:43:46 +02:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
GLuint result = GL_FALSE;
|
|
|
|
glGetQueryObjectuiv(entry.query_id, GL_QUERY_RESULT_AVAILABLE, &result);
|
2016-06-24 10:43:46 +02:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
if (GL_TRUE == result)
|
|
|
|
{
|
|
|
|
FlushOne();
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2013-02-16 17:50:40 -06:00
|
|
|
}
|
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
void PerfQueryGL::FlushOne()
|
2013-02-16 17:50:40 -06:00
|
|
|
{
|
|
|
|
auto& entry = m_query_buffer[m_query_read_pos];
|
2013-03-01 23:12:41 +01:00
|
|
|
|
2013-02-16 17:50:40 -06:00
|
|
|
GLuint result = 0;
|
|
|
|
glGetQueryObjectuiv(entry.query_id, GL_QUERY_RESULT, &result);
|
2013-03-01 23:12:41 +01:00
|
|
|
|
|
|
|
// NOTE: Reported pixel metrics should be referenced to native resolution
|
2016-06-13 15:41:29 +10:00
|
|
|
// TODO: Dropping the lower 2 bits from this count should be closer to actual
|
|
|
|
// hardware behavior when drawing triangles.
|
|
|
|
result = static_cast<u64>(result) * EFB_WIDTH * EFB_HEIGHT /
|
2023-01-31 17:26:46 +13:00
|
|
|
(g_framebuffer_manager->GetEFBWidth() * g_framebuffer_manager->GetEFBHeight());
|
2016-06-13 15:41:29 +10:00
|
|
|
|
|
|
|
// Adjust for multisampling
|
|
|
|
if (g_ActiveConfig.iMultisamples > 1)
|
|
|
|
result /= g_ActiveConfig.iMultisamples;
|
|
|
|
|
2022-11-17 21:54:43 +01:00
|
|
|
m_results[entry.query_group].fetch_add(result, std::memory_order_relaxed);
|
2013-03-01 23:12:41 +01:00
|
|
|
|
2014-02-15 01:12:13 -05:00
|
|
|
m_query_read_pos = (m_query_read_pos + 1) % m_query_buffer.size();
|
2021-05-13 19:30:30 +02:00
|
|
|
m_query_count.fetch_sub(1, std::memory_order_relaxed);
|
2013-02-16 17:50:40 -06:00
|
|
|
}
|
2012-06-17 13:58:29 +02:00
|
|
|
|
2013-02-16 17:50:40 -06:00
|
|
|
// TODO: could selectively flush things, but I don't think that will do much
|
2015-02-21 16:58:53 -06:00
|
|
|
void PerfQueryGL::FlushResults()
|
2013-02-16 17:50:40 -06:00
|
|
|
{
|
|
|
|
while (!IsFlushed())
|
|
|
|
FlushOne();
|
|
|
|
}
|
2012-06-17 13:58:29 +02:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
// Allocates one NV occlusion query object for every slot of the query buffer.
PerfQueryGLESNV::PerfQueryGLESNV()
{
  for (ActiveQuery& slot : m_query_buffer)
  {
    glGenOcclusionQueriesNV(1, &slot.query_id);
  }
}
|
|
|
|
|
|
|
|
// Releases the NV occlusion query object owned by every slot of the query buffer.
PerfQueryGLESNV::~PerfQueryGLESNV()
{
  for (ActiveQuery& slot : m_query_buffer)
  {
    glDeleteOcclusionQueriesNV(1, &slot.query_id);
  }
}
|
|
|
|
|
2022-11-17 21:54:43 +01:00
|
|
|
// Begins an NV occlusion query for `group`, using the query buffer as a
// circular queue that starts at m_query_read_pos and holds m_query_count
// pending entries. Buffer maintenance happens for every group; a query is only
// started for the two ZCOMP groups.
void PerfQueryGLESNV::EnableQuery(PerfQueryGroup group)
{
  const auto capacity = m_query_buffer.size();
  u32 pending = m_query_count.load(std::memory_order_relaxed);

  // Is this sane?
  // More than half of the slots are in use: retire whatever is already available.
  if (pending > capacity / 2)
  {
    WeakFlush();
    pending = m_query_count.load(std::memory_order_relaxed);
  }

  // Still completely full: read back the oldest query unconditionally to free a slot.
  if (capacity == pending)
  {
    FlushOne();
    pending = m_query_count.load(std::memory_order_relaxed);
    // ERROR_LOG_FMT(VIDEO, "Flushed query buffer early!");
  }

  // start query
  if (group != PQG_ZCOMP_ZCOMPLOC && group != PQG_ZCOMP)
    return;

  // The first free slot sits right behind the last pending one.
  auto& slot = m_query_buffer[(m_query_read_pos + pending) % capacity];

  glBeginOcclusionQueryNV(slot.query_id);
  slot.query_group = group;

  m_query_count.fetch_add(1, std::memory_order_relaxed);
}
|
2022-11-17 21:54:43 +01:00
|
|
|
// Ends the active NV occlusion query. Only the two ZCOMP groups ever start
// one, so every other group is ignored.
void PerfQueryGLESNV::DisableQuery(PerfQueryGroup group)
{
  const bool is_zcomp_group = group == PQG_ZCOMP_ZCOMPLOC || group == PQG_ZCOMP;
  if (!is_zcomp_group)
    return;

  // stop query
  glEndOcclusionQueryNV();
}
|
|
|
|
|
|
|
|
void PerfQueryGLESNV::WeakFlush()
|
2013-02-16 17:50:40 -06:00
|
|
|
{
|
|
|
|
while (!IsFlushed())
|
|
|
|
{
|
|
|
|
auto& entry = m_query_buffer[m_query_read_pos];
|
2016-06-24 10:43:46 +02:00
|
|
|
|
2013-02-16 17:50:40 -06:00
|
|
|
GLuint result = GL_FALSE;
|
2015-02-21 16:58:53 -06:00
|
|
|
glGetOcclusionQueryuivNV(entry.query_id, GL_PIXEL_COUNT_AVAILABLE_NV, &result);
|
2016-06-24 10:43:46 +02:00
|
|
|
|
2013-02-16 17:50:40 -06:00
|
|
|
if (GL_TRUE == result)
|
|
|
|
{
|
|
|
|
FlushOne();
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
2012-06-17 13:58:29 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
void PerfQueryGLESNV::FlushOne()
|
2012-06-17 13:58:29 +02:00
|
|
|
{
|
2015-02-21 16:58:53 -06:00
|
|
|
auto& entry = m_query_buffer[m_query_read_pos];
|
2012-06-17 13:58:29 +02:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
GLuint result = 0;
|
|
|
|
glGetOcclusionQueryuivNV(entry.query_id, GL_OCCLUSION_TEST_RESULT_HP, &result);
|
2013-10-29 01:23:17 -04:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
// NOTE: Reported pixel metrics should be referenced to native resolution
|
2016-06-13 15:41:29 +10:00
|
|
|
// TODO: Dropping the lower 2 bits from this count should be closer to actual
|
|
|
|
// hardware behavior when drawing triangles.
|
2023-01-31 17:29:16 +13:00
|
|
|
const u64 native_res_result =
|
|
|
|
static_cast<u64>(result) * EFB_WIDTH * EFB_HEIGHT /
|
|
|
|
(g_framebuffer_manager->GetEFBWidth() * g_framebuffer_manager->GetEFBHeight());
|
2022-11-17 21:54:43 +01:00
|
|
|
m_results[entry.query_group].fetch_add(static_cast<u32>(native_res_result),
|
|
|
|
std::memory_order_relaxed);
|
2013-10-29 01:23:17 -04:00
|
|
|
|
2015-02-21 16:58:53 -06:00
|
|
|
m_query_read_pos = (m_query_read_pos + 1) % m_query_buffer.size();
|
2021-05-13 19:30:30 +02:00
|
|
|
m_query_count.fetch_sub(1, std::memory_order_relaxed);
|
2015-02-21 16:58:53 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: could selectively flush things, but I don't think that will do much
|
|
|
|
void PerfQueryGLESNV::FlushResults()
|
|
|
|
{
|
|
|
|
while (!IsFlushed())
|
|
|
|
FlushOne();
|
2012-06-17 13:58:29 +02:00
|
|
|
}
|
|
|
|
|
2018-10-03 23:02:45 +10:00
|
|
|
} // namespace OGL
|