mirror of
https://github.com/skyline-emu/skyline.git
synced 2025-01-15 11:47:55 +03:00
Introduce IOVA
union for flipped words of IOVAs in GraphicsContext
The Maxwell3D `Address` class follows the big-endian register ordering for addresses while on the host we consume them in little-endian, the `IOVA` class is the host equivalent to the `Address` class with implicitly flipped 32-bit register ordering. It shares implicit decomposition semantics from `Address` due to similar requirements with a minor difference of being returned by reference rather than value as we want to have value setting semantics with implicit decomposition while we don't for `Address`.
This commit is contained in:
parent
73646c4da8
commit
d163e4ffa6
@ -23,6 +23,23 @@ namespace skyline::gpu::interconnect {
|
|||||||
soc::gm20b::ChannelContext &channelCtx;
|
soc::gm20b::ChannelContext &channelCtx;
|
||||||
gpu::interconnect::CommandExecutor &executor;
|
gpu::interconnect::CommandExecutor &executor;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief A host IOVA address composed of 32-bit low/high register values
|
||||||
|
* @note This differs from maxwell3d::Address in that it is little-endian rather than big-endian ordered for the register values
|
||||||
|
*/
|
||||||
|
union IOVA {
|
||||||
|
u64 iova;
|
||||||
|
struct {
|
||||||
|
u32 low;
|
||||||
|
u32 high;
|
||||||
|
};
|
||||||
|
|
||||||
|
operator u64&() {
|
||||||
|
return iova;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
static_assert(sizeof(IOVA) == sizeof(u64));
|
||||||
|
|
||||||
public:
|
public:
|
||||||
GraphicsContext(GPU &gpu, soc::gm20b::ChannelContext &channelCtx, gpu::interconnect::CommandExecutor &executor) : gpu(gpu), channelCtx(channelCtx), executor(executor) {
|
GraphicsContext(GPU &gpu, soc::gm20b::ChannelContext &channelCtx, gpu::interconnect::CommandExecutor &executor) : gpu(gpu), channelCtx(channelCtx), executor(executor) {
|
||||||
scissors.fill(DefaultScissor);
|
scissors.fill(DefaultScissor);
|
||||||
@ -34,13 +51,7 @@ namespace skyline::gpu::interconnect {
|
|||||||
private:
|
private:
|
||||||
struct RenderTarget {
|
struct RenderTarget {
|
||||||
bool disabled{true}; //!< If this RT has been disabled and will be an unbound attachment instead
|
bool disabled{true}; //!< If this RT has been disabled and will be an unbound attachment instead
|
||||||
union {
|
IOVA iova;
|
||||||
u64 gpuAddress;
|
|
||||||
struct {
|
|
||||||
u32 gpuAddressLow;
|
|
||||||
u32 gpuAddressHigh;
|
|
||||||
};
|
|
||||||
};
|
|
||||||
u32 widthBytes; //!< The width in bytes for linear textures
|
u32 widthBytes; //!< The width in bytes for linear textures
|
||||||
GuestTexture guest;
|
GuestTexture guest;
|
||||||
std::optional<TextureView> view;
|
std::optional<TextureView> view;
|
||||||
@ -56,14 +67,14 @@ namespace skyline::gpu::interconnect {
|
|||||||
public:
|
public:
|
||||||
void SetRenderTargetAddressHigh(size_t index, u32 high) {
|
void SetRenderTargetAddressHigh(size_t index, u32 high) {
|
||||||
auto &renderTarget{renderTargets.at(index)};
|
auto &renderTarget{renderTargets.at(index)};
|
||||||
renderTarget.gpuAddressHigh = high;
|
renderTarget.iova.high = high;
|
||||||
renderTarget.guest.mappings.clear();
|
renderTarget.guest.mappings.clear();
|
||||||
renderTarget.view.reset();
|
renderTarget.view.reset();
|
||||||
}
|
}
|
||||||
|
|
||||||
void SetRenderTargetAddressLow(size_t index, u32 low) {
|
void SetRenderTargetAddressLow(size_t index, u32 low) {
|
||||||
auto &renderTarget{renderTargets.at(index)};
|
auto &renderTarget{renderTargets.at(index)};
|
||||||
renderTarget.gpuAddressLow = low;
|
renderTarget.iova.low = low;
|
||||||
renderTarget.guest.mappings.clear();
|
renderTarget.guest.mappings.clear();
|
||||||
renderTarget.view.reset();
|
renderTarget.view.reset();
|
||||||
}
|
}
|
||||||
@ -211,7 +222,7 @@ namespace skyline::gpu::interconnect {
|
|||||||
|
|
||||||
if (renderTarget.guest.mappings.empty()) {
|
if (renderTarget.guest.mappings.empty()) {
|
||||||
auto size{std::max<u64>(renderTarget.guest.layerStride * (renderTarget.guest.layerCount - renderTarget.guest.baseArrayLayer), renderTarget.guest.format->GetSize(renderTarget.guest.dimensions))};
|
auto size{std::max<u64>(renderTarget.guest.layerStride * (renderTarget.guest.layerCount - renderTarget.guest.baseArrayLayer), renderTarget.guest.format->GetSize(renderTarget.guest.dimensions))};
|
||||||
auto mappings{channelCtx.asCtx->gmmu.TranslateRange(renderTarget.gpuAddress, size)};
|
auto mappings{channelCtx.asCtx->gmmu.TranslateRange(renderTarget.iova, size)};
|
||||||
renderTarget.guest.mappings.assign(mappings.begin(), mappings.end());
|
renderTarget.guest.mappings.assign(mappings.begin(), mappings.end());
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -347,18 +358,18 @@ namespace skyline::gpu::interconnect {
|
|||||||
span<u8> data; //!< The shader bytecode in the CPU AS
|
span<u8> data; //!< The shader bytecode in the CPU AS
|
||||||
};
|
};
|
||||||
|
|
||||||
u64 shaderBaseIova{}; //!< The base IOVA that shaders are located at an offset from
|
IOVA shaderBaseIova{}; //!< The base IOVA that shaders are located at an offset from
|
||||||
std::array<Shader, maxwell3d::StageCount> boundShaders{};
|
std::array<Shader, maxwell3d::StageCount> boundShaders{};
|
||||||
|
|
||||||
public:
|
public:
|
||||||
void SetShaderBaseIovaHigh(u32 high) {
|
void SetShaderBaseIovaHigh(u32 high) {
|
||||||
shaderBaseIova = (shaderBaseIova & std::numeric_limits<u32>::max()) | (static_cast<u64>(high) << 32);
|
shaderBaseIova.high = high;
|
||||||
for (auto &shader : boundShaders)
|
for (auto &shader : boundShaders)
|
||||||
shader.data = span<u8>{};
|
shader.data = span<u8>{};
|
||||||
}
|
}
|
||||||
|
|
||||||
void SetShaderBaseIovaLow(u32 low) {
|
void SetShaderBaseIovaLow(u32 low) {
|
||||||
shaderBaseIova = (shaderBaseIova & (static_cast<u64>(std::numeric_limits<u32>::max()) << 32)) | low;
|
shaderBaseIova.low = low;
|
||||||
for (auto &shader : boundShaders)
|
for (auto &shader : boundShaders)
|
||||||
shader.data = span<u8>{};
|
shader.data = span<u8>{};
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user