Make Texture::SynchronizeGuest Blocking

It was determined that `Texture::SynchronizeGuest`'s `TextureBufferCopy` had races that were exposed by the introduction of the cycle waiter thread, the synchronization did not take place under a locked context so the texture could be mutated at any point in addition to the destructor not being run during `FenceCycle::Wait` due to `shouldDestroy` being `false`. 

This commit fixes the issue by making `SynchronizeGuest` entirely blocking as all usages of the function required blocking semantics regardless so it would be pointless to retain its async nature while solving any races that may arise from it being async.

Co-authored-by: Billy Laws <blaws05@gmail.com>
This commit is contained in:
PixelyIon 2022-08-06 15:47:11 +05:30
parent 77d15b02a3
commit 850c0f4092
No known key found for this signature in database
GPG Key ID: 11BC6C3201BC2C05
2 changed files with 5 additions and 26 deletions

View File

@ -176,7 +176,6 @@ namespace skyline::gpu {
return false; return false;
texture->SynchronizeGuest(false, true); // We can skip trapping since the caller will do it texture->SynchronizeGuest(false, true); // We can skip trapping since the caller will do it
texture->WaitOnFence();
return true; return true;
}, [weakThis] { }, [weakThis] {
TRACE_EVENT("gpu", "Texture::WriteTrap"); TRACE_EVENT("gpu", "Texture::WriteTrap");
@ -198,7 +197,6 @@ namespace skyline::gpu {
if (!lock) if (!lock)
return false; return false;
texture->SynchronizeGuest(true, true); // We need to assume the texture is dirty since we don't know what the guest is writing texture->SynchronizeGuest(true, true); // We need to assume the texture is dirty since we don't know what the guest is writing
texture->WaitOnFence();
return true; return true;
}); });
} }
@ -455,13 +453,6 @@ namespace skyline::gpu {
} }
} }
Texture::TextureBufferCopy::TextureBufferCopy(std::shared_ptr<Texture> texture, std::shared_ptr<memory::StagingBuffer> stagingBuffer) : texture(std::move(texture)), stagingBuffer(std::move(stagingBuffer)) {}
Texture::TextureBufferCopy::~TextureBufferCopy() {
TRACE_EVENT("gpu", "Texture::TextureBufferCopy");
texture->CopyToGuest(stagingBuffer ? stagingBuffer->data() : std::get<memory::Image>(texture->backing).data());
}
Texture::Texture(GPU &gpu, BackingType &&backing, texture::Dimensions dimensions, texture::Format format, vk::ImageLayout layout, vk::ImageTiling tiling, vk::ImageCreateFlags flags, vk::ImageUsageFlags usage, u32 levelCount, u32 layerCount, vk::SampleCountFlagBits sampleCount) Texture::Texture(GPU &gpu, BackingType &&backing, texture::Dimensions dimensions, texture::Format format, vk::ImageLayout layout, vk::ImageTiling tiling, vk::ImageCreateFlags flags, vk::ImageUsageFlags usage, u32 levelCount, u32 layerCount, vk::SampleCountFlagBits sampleCount)
: gpu(gpu), : gpu(gpu),
backing(std::move(backing)), backing(std::move(backing)),
@ -596,7 +587,6 @@ namespace skyline::gpu {
gpu.state.nce->DeleteTrap(*trapHandle); gpu.state.nce->DeleteTrap(*trapHandle);
if (alignedMirror.valid()) if (alignedMirror.valid())
munmap(alignedMirror.data(), alignedMirror.size()); munmap(alignedMirror.data(), alignedMirror.size());
WaitOnFence();
} }
void Texture::lock() { void Texture::lock() {
@ -780,12 +770,13 @@ namespace skyline::gpu {
if (tiling == vk::ImageTiling::eOptimal || !std::holds_alternative<memory::Image>(backing)) { if (tiling == vk::ImageTiling::eOptimal || !std::holds_alternative<memory::Image>(backing)) {
auto stagingBuffer{gpu.memory.AllocateStagingBuffer(surfaceSize)}; auto stagingBuffer{gpu.memory.AllocateStagingBuffer(surfaceSize)};
WaitOnFence();
auto lCycle{gpu.scheduler.Submit([&](vk::raii::CommandBuffer &commandBuffer) { auto lCycle{gpu.scheduler.Submit([&](vk::raii::CommandBuffer &commandBuffer) {
CopyIntoStagingBuffer(commandBuffer, stagingBuffer); CopyIntoStagingBuffer(commandBuffer, stagingBuffer);
})}; })};
lCycle->AttachObject(std::make_shared<TextureBufferCopy>(shared_from_this(), stagingBuffer)); lCycle->Wait(); // We block till the copy is complete
lCycle->ChainCycle(cycle);
cycle = lCycle; CopyToGuest(stagingBuffer->data());
} else if (tiling == vk::ImageTiling::eLinear) { } else if (tiling == vk::ImageTiling::eLinear) {
// We can optimize linear texture sync on a UMA by mapping the texture onto the CPU and copying directly from it rather than using a staging buffer // We can optimize linear texture sync on a UMA by mapping the texture onto the CPU and copying directly from it rather than using a staging buffer
WaitOnFence(); WaitOnFence();

View File

@ -416,18 +416,6 @@ namespace skyline::gpu {
*/ */
void CopyToGuest(u8 *hostBuffer); void CopyToGuest(u8 *hostBuffer);
/**
* @brief A fence cycle dependency that copies the contents of a staging buffer or mapped image backing the texture to the guest texture
*/
struct TextureBufferCopy {
std::shared_ptr<Texture> texture;
std::shared_ptr<memory::StagingBuffer> stagingBuffer;
TextureBufferCopy(std::shared_ptr<Texture> texture, std::shared_ptr<memory::StagingBuffer> stagingBuffer = {});
~TextureBufferCopy();
};
/** /**
* @return A vector of all the buffer image copies that need to be done for every aspect of every level of every layer of the texture * @return A vector of all the buffer image copies that need to be done for every aspect of every level of every layer of the texture
*/ */
@ -547,7 +535,7 @@ namespace skyline::gpu {
* @brief Synchronizes the guest texture with the host texture after it has been modified * @brief Synchronizes the guest texture with the host texture after it has been modified
* @param cpuDirty If true, the texture will be transitioned to being CpuDirty by this call * @param cpuDirty If true, the texture will be transitioned to being CpuDirty by this call
* @param skipTrap If true, trapping/untrapping the guest mappings will be skipped and has to be handled by the caller * @param skipTrap If true, trapping/untrapping the guest mappings will be skipped and has to be handled by the caller
* @note This function is not blocking and the synchronization will not be complete until the associated fence is signalled, it can be waited on with WaitOnFence() * @note This function is blocking and waiting on the fence is not required
* @note The texture **must** be locked prior to calling this * @note The texture **must** be locked prior to calling this
*/ */
void SynchronizeGuest(bool cpuDirty = false, bool skipTrap = false); void SynchronizeGuest(bool cpuDirty = false, bool skipTrap = false);