mirror of
https://github.com/skyline-emu/skyline.git
synced 2025-01-11 17:09:11 +01:00
Submit GPFIFO work prior to CircularQueue
waiting
The position at which we call submit is a significant factor in performance and we did so at the end of PBs (PushBuffers), this isn't optimal as there could be multiple PBs queued up that would benefit from being in the same submission. We now delay the submission of the workload till we run out of PBs.
This commit is contained in:
parent
3ac5ed8c06
commit
561103d3da
@ -49,9 +49,10 @@ namespace skyline {
|
||||
/**
|
||||
* @brief A blocking for-each that runs on every item and waits till new items to run on them as well
|
||||
* @param function A function that is called for each item (with the only parameter as a reference to that item)
|
||||
* @param preWait An optional function that's called prior to waiting on more items to be queued
|
||||
*/
|
||||
template<typename F>
|
||||
[[noreturn]] void Process(F function) {
|
||||
template<typename F1, typename F2>
|
||||
[[noreturn]] void Process(F1 function, F2 preWait) {
|
||||
TRACE_EVENT_BEGIN("containers", "CircularQueue::Process");
|
||||
|
||||
while (true) {
|
||||
@ -59,6 +60,7 @@ namespace skyline {
|
||||
std::unique_lock lock(productionMutex);
|
||||
|
||||
TRACE_EVENT_END("containers");
|
||||
preWait();
|
||||
produceCondition.wait(lock, [this]() { return start != end; });
|
||||
TRACE_EVENT_BEGIN("containers", "CircularQueue::Process");
|
||||
}
|
||||
|
@ -227,7 +227,7 @@ namespace skyline::gpu {
|
||||
presentQueue.Process([this](const PresentableFrame &frame) {
|
||||
PresentFrame(frame);
|
||||
frame.presentCallback(); // We're calling the callback here as it's outside of all the locks in PresentFrame
|
||||
});
|
||||
}, [] {});
|
||||
} catch (const signal::SignalException &e) {
|
||||
Logger::Error("{}\nStack Trace:{}", e.what(), state.loader->GetStackTrace(e.frames));
|
||||
if (state.process)
|
||||
|
@ -150,6 +150,10 @@ namespace skyline::soc::gm20b {
|
||||
}
|
||||
|
||||
void ChannelGpfifo::Process(GpEntry gpEntry) {
|
||||
// Submit if required by the GpEntry, this is needed as some games dynamically generate pushbuffer contents
|
||||
if (gpEntry.sync == GpEntry::Sync::Wait)
|
||||
channelCtx.executor.Submit();
|
||||
|
||||
if (!gpEntry.size) {
|
||||
// This is a GPFIFO control entry, all control entries have a zero length and contain no pushbuffers
|
||||
switch (gpEntry.opcode) {
|
||||
@ -335,8 +339,6 @@ namespace skyline::soc::gm20b {
|
||||
if (hitEnd)
|
||||
break;
|
||||
}
|
||||
|
||||
channelCtx.executor.Submit();
|
||||
}
|
||||
|
||||
void ChannelGpfifo::Run() {
|
||||
@ -350,6 +352,10 @@ namespace skyline::soc::gm20b {
|
||||
gpEntries.Process([this](GpEntry gpEntry) {
|
||||
Logger::Debug("Processing pushbuffer: 0x{:X}, Size: 0x{:X}", gpEntry.Address(), +gpEntry.size);
|
||||
Process(gpEntry);
|
||||
}, [this]() {
|
||||
// If we run out of GpEntries to process ensure we submit any remaining GPU work before waiting for more to arrive
|
||||
Logger::Debug("Finished processing pushbuffer batch");
|
||||
channelCtx.executor.Submit();
|
||||
});
|
||||
} catch (const signal::SignalException &e) {
|
||||
if (e.signal != SIGINT) {
|
||||
|
@ -124,7 +124,7 @@ namespace skyline::soc::host1x {
|
||||
gatherQueue.Process([this](span<u32> gather) {
|
||||
Logger::Debug("Processing pushbuffer: 0x{:X}, size: 0x{:X}", gather.data(), gather.size());
|
||||
Process(gather);
|
||||
});
|
||||
}, [] {});
|
||||
} catch (const signal::SignalException &e) {
|
||||
if (e.signal != SIGINT) {
|
||||
Logger::Error("{}\nStack Trace:{}", e.what(), state.loader->GetStackTrace(e.frames));
|
||||
|
Loading…
x
Reference in New Issue
Block a user