mirror of
https://github.com/skyline-emu/skyline.git
synced 2025-01-01 09:45:38 +03:00
Share single flag variable for Maxwell3D batch draw/constant buffer update
Slightly cheaper
This commit is contained in:
parent
bd7eee8e2b
commit
38aad21d29
@ -70,8 +70,8 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
}
|
}
|
||||||
|
|
||||||
__attribute__((always_inline)) void Maxwell3D::FlushDeferredDraw() {
|
__attribute__((always_inline)) void Maxwell3D::FlushDeferredDraw() {
|
||||||
if (deferredDraw.pending) {
|
if (batchEnableState.drawActive) {
|
||||||
deferredDraw.pending = false;
|
batchEnableState.drawActive = false;
|
||||||
interconnect.Draw(deferredDraw.drawTopology, deferredDraw.indexed, deferredDraw.drawCount, deferredDraw.drawFirst, deferredDraw.instanceCount, deferredDraw.drawBaseVertex, deferredDraw.drawBaseInstance);
|
interconnect.Draw(deferredDraw.drawTopology, deferredDraw.indexed, deferredDraw.drawCount, deferredDraw.drawFirst, deferredDraw.instanceCount, deferredDraw.drawBaseVertex, deferredDraw.drawBaseInstance);
|
||||||
deferredDraw.instanceCount = 1;
|
deferredDraw.instanceCount = 1;
|
||||||
}
|
}
|
||||||
@ -92,8 +92,8 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
bool redundant{registers.raw[method] == argument};
|
bool redundant{registers.raw[method] == argument};
|
||||||
registers.raw[method] = argument;
|
registers.raw[method] = argument;
|
||||||
|
|
||||||
// TODO COMBINE THESE
|
if (batchEnableState.raw) {
|
||||||
if (batchLoadConstantBuffer.Active()) {
|
if (batchEnableState.constantBufferActive) {
|
||||||
switch (method) {
|
switch (method) {
|
||||||
// Add to the batch constant buffer update buffer
|
// Add to the batch constant buffer update buffer
|
||||||
// Return early here so that any code below can rely on the fact that any cbuf updates will always be the first of a batch
|
// Return early here so that any code below can rely on the fact that any cbuf updates will always be the first of a batch
|
||||||
@ -109,11 +109,12 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
default:
|
default:
|
||||||
// When a method other than constant buffer update is called submit our submit the previously built-up update as a batch
|
// When a method other than constant buffer update is called submit our submit the previously built-up update as a batch
|
||||||
interconnect.DisableQuickConstantBufferBind();
|
interconnect.DisableQuickConstantBufferBind();
|
||||||
interconnect.LoadConstantBuffer(batchLoadConstantBuffer.buffer, batchLoadConstantBuffer.Invalidate());
|
interconnect.LoadConstantBuffer(batchLoadConstantBuffer.buffer, batchLoadConstantBuffer.startOffset);
|
||||||
|
batchEnableState.constantBufferActive = false;
|
||||||
batchLoadConstantBuffer.Reset();
|
batchLoadConstantBuffer.Reset();
|
||||||
break; // Continue on here to handle the actual method
|
break; // Continue on here to handle the actual method
|
||||||
}
|
}
|
||||||
} else if (deferredDraw.pending) { // See DeferredDrawState comment for full details
|
} else if (batchEnableState.drawActive) { // See DeferredDrawState comment for full details
|
||||||
switch (method) {
|
switch (method) {
|
||||||
ENGINE_CASE(begin, {
|
ENGINE_CASE(begin, {
|
||||||
if (begin.instanceId == Registers::Begin::InstanceId::Subsequent) {
|
if (begin.instanceId == Registers::Begin::InstanceId::Subsequent) {
|
||||||
@ -151,12 +152,11 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
if (!redundant) {
|
|
||||||
dirtyManager.MarkDirty(method);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (!redundant)
|
||||||
|
dirtyManager.MarkDirty(method);
|
||||||
|
|
||||||
switch (method) {
|
switch (method) {
|
||||||
ENGINE_STRUCT_CASE(mme, instructionRamLoad, {
|
ENGINE_STRUCT_CASE(mme, instructionRamLoad, {
|
||||||
if (registers.mme->instructionRamPointer >= macroState.macroCode.size())
|
if (registers.mme->instructionRamPointer >= macroState.macroCode.size())
|
||||||
@ -208,11 +208,13 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
ENGINE_STRUCT_CASE(drawVertexArray, count, {
|
ENGINE_STRUCT_CASE(drawVertexArray, count, {
|
||||||
// Defer the draw until the first non-draw operation to allow for detecting instanced draws (see DeferredDrawState comment)
|
// Defer the draw until the first non-draw operation to allow for detecting instanced draws (see DeferredDrawState comment)
|
||||||
deferredDraw.Set(count, *registers.vertexArrayStart, 0, *registers.globalBaseInstanceIndex, GetCurrentTopology(), false);
|
deferredDraw.Set(count, *registers.vertexArrayStart, 0, *registers.globalBaseInstanceIndex, GetCurrentTopology(), false);
|
||||||
|
batchEnableState.drawActive = true;
|
||||||
})
|
})
|
||||||
|
|
||||||
ENGINE_STRUCT_CASE(drawIndexBuffer, count, {
|
ENGINE_STRUCT_CASE(drawIndexBuffer, count, {
|
||||||
// Defer the draw until the first non-draw operation to allow for detecting instanced draws (see DeferredDrawState comment)
|
// Defer the draw until the first non-draw operation to allow for detecting instanced draws (see DeferredDrawState comment)
|
||||||
deferredDraw.Set(count, registers.indexBuffer->first, *registers.globalBaseVertexIndex, *registers.globalBaseInstanceIndex, GetCurrentTopology(), true);
|
deferredDraw.Set(count, registers.indexBuffer->first, *registers.globalBaseVertexIndex, *registers.globalBaseInstanceIndex, GetCurrentTopology(), true);
|
||||||
|
batchEnableState.drawActive = true;
|
||||||
})
|
})
|
||||||
|
|
||||||
ENGINE_STRUCT_CASE(semaphore, info, {
|
ENGINE_STRUCT_CASE(semaphore, info, {
|
||||||
@ -253,6 +255,7 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
ENGINE_STRUCT_ARRAY_CASE(loadConstantBuffer, data, index, { \
|
ENGINE_STRUCT_ARRAY_CASE(loadConstantBuffer, data, index, { \
|
||||||
batchLoadConstantBuffer.startOffset = registers.loadConstantBuffer->offset; \
|
batchLoadConstantBuffer.startOffset = registers.loadConstantBuffer->offset; \
|
||||||
batchLoadConstantBuffer.buffer.push_back(data); \
|
batchLoadConstantBuffer.buffer.push_back(data); \
|
||||||
|
batchEnableState.constantBufferActive = true; \
|
||||||
registers.loadConstantBuffer->offset += 4; \
|
registers.loadConstantBuffer->offset += 4; \
|
||||||
})
|
})
|
||||||
|
|
||||||
@ -296,8 +299,9 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
void Maxwell3D::FlushEngineState() {
|
void Maxwell3D::FlushEngineState() {
|
||||||
FlushDeferredDraw();
|
FlushDeferredDraw();
|
||||||
|
|
||||||
if (batchLoadConstantBuffer.Active()) {
|
if (batchEnableState.constantBufferActive) {
|
||||||
interconnect.LoadConstantBuffer(batchLoadConstantBuffer.buffer, batchLoadConstantBuffer.Invalidate());
|
interconnect.LoadConstantBuffer(batchLoadConstantBuffer.buffer, batchLoadConstantBuffer.startOffset);
|
||||||
|
batchEnableState.constantBufferActive = false;
|
||||||
batchLoadConstantBuffer.Reset();
|
batchLoadConstantBuffer.Reset();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -27,17 +27,18 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
gpu::interconnect::maxwell3d::DirtyManager dirtyManager;
|
gpu::interconnect::maxwell3d::DirtyManager dirtyManager;
|
||||||
gpu::interconnect::maxwell3d::Maxwell3D interconnect;
|
gpu::interconnect::maxwell3d::Maxwell3D interconnect;
|
||||||
|
|
||||||
|
union BatchEnableState {
|
||||||
|
u8 raw{};
|
||||||
|
|
||||||
|
struct {
|
||||||
|
bool constantBufferActive : 1;
|
||||||
|
bool drawActive : 1;
|
||||||
|
};
|
||||||
|
} batchEnableState{};
|
||||||
|
|
||||||
struct BatchLoadConstantBufferState {
|
struct BatchLoadConstantBufferState {
|
||||||
std::vector<u32> buffer;
|
std::vector<u32> buffer;
|
||||||
u32 startOffset{std::numeric_limits<u32>::max()};
|
u32 startOffset{};
|
||||||
|
|
||||||
bool Active() {
|
|
||||||
return startOffset != std::numeric_limits<u32>::max();
|
|
||||||
}
|
|
||||||
|
|
||||||
u32 Invalidate() {
|
|
||||||
return std::exchange(startOffset, std::numeric_limits<u32>::max());
|
|
||||||
}
|
|
||||||
|
|
||||||
void Reset() {
|
void Reset() {
|
||||||
buffer.clear();
|
buffer.clear();
|
||||||
@ -48,7 +49,6 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
* @brief In the Maxwell 3D engine, instanced draws are implemented by repeating the exact same draw in sequence with special flag set in vertexBeginGl. This flag allows either incrementing the instance counter or resetting it, since we need to supply an instance count to the host API we defer all draws until state changes occur. If there are no state changes between draws we can skip them and count the occurences to get the number of instances to draw.
|
* @brief In the Maxwell 3D engine, instanced draws are implemented by repeating the exact same draw in sequence with special flag set in vertexBeginGl. This flag allows either incrementing the instance counter or resetting it, since we need to supply an instance count to the host API we defer all draws until state changes occur. If there are no state changes between draws we can skip them and count the occurences to get the number of instances to draw.
|
||||||
*/
|
*/
|
||||||
struct DeferredDrawState {
|
struct DeferredDrawState {
|
||||||
bool pending;
|
|
||||||
bool indexed; //!< If the deferred draw is indexed
|
bool indexed; //!< If the deferred draw is indexed
|
||||||
type::DrawTopology drawTopology; //!< Topology of draw at draw time
|
type::DrawTopology drawTopology; //!< Topology of draw at draw time
|
||||||
u32 instanceCount{1}; //!< Number of instances in the final draw
|
u32 instanceCount{1}; //!< Number of instances in the final draw
|
||||||
@ -61,7 +61,6 @@ namespace skyline::soc::gm20b::engine::maxwell3d {
|
|||||||
* @brief Sets up the state necessary to defer a new draw
|
* @brief Sets up the state necessary to defer a new draw
|
||||||
*/
|
*/
|
||||||
void Set(u32 pDrawCount, u32 pDrawFirst, u32 pDrawBaseVertex, u32 pDrawBaseInstance, type::DrawTopology pDrawTopology, bool pIndexed) {
|
void Set(u32 pDrawCount, u32 pDrawFirst, u32 pDrawBaseVertex, u32 pDrawBaseInstance, type::DrawTopology pDrawTopology, bool pIndexed) {
|
||||||
pending = true;
|
|
||||||
indexed = pIndexed;
|
indexed = pIndexed;
|
||||||
drawTopology = pDrawTopology;
|
drawTopology = pDrawTopology;
|
||||||
drawCount = pDrawCount;
|
drawCount = pDrawCount;
|
||||||
|
Loading…
Reference in New Issue
Block a user