mirror of
https://github.com/skyline-emu/skyline.git
synced 2024-12-28 08:45:29 +03:00
Add guest shader replacement and dumping support
This commit is contained in:
parent
2f6d27e8d7
commit
326c05a5de
@ -400,14 +400,18 @@ namespace skyline::gpu {
|
|||||||
buffer(*this),
|
buffer(*this),
|
||||||
megaBufferAllocator(*this),
|
megaBufferAllocator(*this),
|
||||||
descriptor(*this),
|
descriptor(*this),
|
||||||
shader(state, *this),
|
|
||||||
helperShaders(*this, state.os->assetFileSystem),
|
helperShaders(*this, state.os->assetFileSystem),
|
||||||
graphicsPipelineCache(*this),
|
graphicsPipelineCache(*this),
|
||||||
renderPassCache(*this),
|
renderPassCache(*this),
|
||||||
framebufferCache(*this) {}
|
framebufferCache(*this) {}
|
||||||
|
|
||||||
void GPU::Initialise() {
|
void GPU::Initialise() {
|
||||||
graphicsPipelineCacheManager.emplace(state, state.os->publicAppFilesPath + "graphics_pipeline_cache/" + state.loader->nacp->GetSaveDataOwnerId());
|
std::string titleId{state.loader->nacp->GetSaveDataOwnerId()};
|
||||||
|
shader.emplace(state, *this,
|
||||||
|
state.os->publicAppFilesPath + "shader_replacements/" + titleId,
|
||||||
|
state.os->publicAppFilesPath + "shader_dumps/" + titleId);
|
||||||
|
graphicsPipelineCacheManager.emplace(state,
|
||||||
|
state.os->publicAppFilesPath + "graphics_pipeline_cache/" + titleId);
|
||||||
graphicsPipelineManager.emplace(*this);
|
graphicsPipelineManager.emplace(*this);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -55,7 +55,7 @@ namespace skyline::gpu {
|
|||||||
MegaBufferAllocator megaBufferAllocator;
|
MegaBufferAllocator megaBufferAllocator;
|
||||||
|
|
||||||
DescriptorAllocator descriptor;
|
DescriptorAllocator descriptor;
|
||||||
ShaderManager shader;
|
std::optional<ShaderManager> shader;
|
||||||
|
|
||||||
HelperShaders helperShaders;
|
HelperShaders helperShaders;
|
||||||
|
|
||||||
|
@ -10,10 +10,10 @@
|
|||||||
|
|
||||||
namespace skyline::gpu::interconnect::kepler_compute {
|
namespace skyline::gpu::interconnect::kepler_compute {
|
||||||
static Pipeline::ShaderStage MakePipelineShader(InterconnectContext &ctx, Textures &textures, ConstantBufferSet &constantBuffers, const PackedPipelineState &packedState, const ShaderBinary &shaderBinary) {
|
static Pipeline::ShaderStage MakePipelineShader(InterconnectContext &ctx, Textures &textures, ConstantBufferSet &constantBuffers, const PackedPipelineState &packedState, const ShaderBinary &shaderBinary) {
|
||||||
ctx.gpu.shader.ResetPools();
|
ctx.gpu.shader->ResetPools();
|
||||||
|
|
||||||
auto program{ctx.gpu.shader.ParseComputeShader(
|
auto program{ctx.gpu.shader->ParseComputeShader(
|
||||||
shaderBinary.binary, shaderBinary.baseOffset,
|
packedState.shaderHash, shaderBinary.binary, shaderBinary.baseOffset,
|
||||||
packedState.bindlessTextureConstantBufferSlotSelect,
|
packedState.bindlessTextureConstantBufferSlotSelect,
|
||||||
packedState.localMemorySize, packedState.sharedMemorySize,
|
packedState.localMemorySize, packedState.sharedMemorySize,
|
||||||
packedState.dimensions,
|
packedState.dimensions,
|
||||||
@ -25,7 +25,7 @@ namespace skyline::gpu::interconnect::kepler_compute {
|
|||||||
|
|
||||||
Shader::Backend::Bindings bindings{};
|
Shader::Backend::Bindings bindings{};
|
||||||
|
|
||||||
return {ctx.gpu.shader.CompileShader({}, program, bindings), program.info};
|
return {ctx.gpu.shader->CompileShader({}, program, bindings), program.info};
|
||||||
}
|
}
|
||||||
|
|
||||||
static Pipeline::DescriptorInfo MakePipelineDescriptorInfo(const Pipeline::ShaderStage &stage) {
|
static Pipeline::DescriptorInfo MakePipelineDescriptorInfo(const Pipeline::ShaderStage &stage) {
|
||||||
|
@ -187,7 +187,7 @@ namespace skyline::gpu::interconnect::maxwell3d {
|
|||||||
}
|
}
|
||||||
|
|
||||||
static std::array<Pipeline::ShaderStage, engine::ShaderStageCount> MakePipelineShaders(GPU &gpu, const PipelineStateAccessor &accessor, const PackedPipelineState &packedState) {
|
static std::array<Pipeline::ShaderStage, engine::ShaderStageCount> MakePipelineShaders(GPU &gpu, const PipelineStateAccessor &accessor, const PackedPipelineState &packedState) {
|
||||||
gpu.shader.ResetPools();
|
gpu.shader->ResetPools();
|
||||||
|
|
||||||
using PipelineStage = engine::Pipeline::Shader::Type;
|
using PipelineStage = engine::Pipeline::Shader::Type;
|
||||||
auto pipelineStage{[](u32 i) { return static_cast<PipelineStage>(i); }};
|
auto pipelineStage{[](u32 i) { return static_cast<PipelineStage>(i); }};
|
||||||
@ -200,16 +200,16 @@ namespace skyline::gpu::interconnect::maxwell3d {
|
|||||||
for (u32 i{}; i < engine::PipelineCount; i++) {
|
for (u32 i{}; i < engine::PipelineCount; i++) {
|
||||||
if (!packedState.shaderHashes[i]) {
|
if (!packedState.shaderHashes[i]) {
|
||||||
if (i == stageIdx(PipelineStage::Geometry) && layerConversionSourceProgram)
|
if (i == stageIdx(PipelineStage::Geometry) && layerConversionSourceProgram)
|
||||||
programs[i] = gpu.shader.GenerateGeometryPassthroughShader(*layerConversionSourceProgram, ConvertShaderOutputTopology(packedState.topology));
|
programs[i] = gpu.shader->GenerateGeometryPassthroughShader(*layerConversionSourceProgram, ConvertShaderOutputTopology(packedState.topology));
|
||||||
|
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
auto binary{accessor.GetShaderBinary(i)};
|
auto binary{accessor.GetShaderBinary(i)};
|
||||||
auto program{gpu.shader.ParseGraphicsShader(
|
auto program{gpu.shader->ParseGraphicsShader(
|
||||||
packedState.postVtgShaderAttributeSkipMask,
|
packedState.postVtgShaderAttributeSkipMask,
|
||||||
ConvertCompilerShaderStage(static_cast<PipelineStage>(i)),
|
ConvertCompilerShaderStage(static_cast<PipelineStage>(i)),
|
||||||
binary.binary, binary.baseOffset,
|
packedState.shaderHashes[i], binary.binary, binary.baseOffset,
|
||||||
packedState.bindlessTextureConstantBufferSlotSelect,
|
packedState.bindlessTextureConstantBufferSlotSelect,
|
||||||
packedState.viewportTransformEnable,
|
packedState.viewportTransformEnable,
|
||||||
[&](u32 index, u32 offset) {
|
[&](u32 index, u32 offset) {
|
||||||
@ -220,7 +220,7 @@ namespace skyline::gpu::interconnect::maxwell3d {
|
|||||||
})};
|
})};
|
||||||
if (i == stageIdx(PipelineStage::Vertex) && packedState.shaderHashes[stageIdx(PipelineStage::VertexCullBeforeFetch)]) {
|
if (i == stageIdx(PipelineStage::Vertex) && packedState.shaderHashes[stageIdx(PipelineStage::VertexCullBeforeFetch)]) {
|
||||||
ignoreVertexCullBeforeFetch = true;
|
ignoreVertexCullBeforeFetch = true;
|
||||||
programs[i] = gpu.shader.CombineVertexShaders(programs[stageIdx(PipelineStage::VertexCullBeforeFetch)], program, binary.binary);
|
programs[i] = gpu.shader->CombineVertexShaders(programs[stageIdx(PipelineStage::VertexCullBeforeFetch)], program, binary.binary);
|
||||||
} else {
|
} else {
|
||||||
programs[i] = program;
|
programs[i] = program;
|
||||||
}
|
}
|
||||||
@ -240,7 +240,9 @@ namespace skyline::gpu::interconnect::maxwell3d {
|
|||||||
continue;
|
continue;
|
||||||
|
|
||||||
auto runtimeInfo{MakeRuntimeInfo(packedState, programs[i], lastProgram, hasGeometry)};
|
auto runtimeInfo{MakeRuntimeInfo(packedState, programs[i], lastProgram, hasGeometry)};
|
||||||
shaderStages[i - (i >= 1 ? 1 : 0)] = {ConvertVkShaderStage(pipelineStage(i)), gpu.shader.CompileShader(runtimeInfo, programs[i], bindings), programs[i].info};
|
shaderStages[i - (i >= 1 ? 1 : 0)] = {ConvertVkShaderStage(pipelineStage(i)),
|
||||||
|
gpu.shader->CompileShader(runtimeInfo, programs[i], bindings, packedState.shaderHashes[i]),
|
||||||
|
programs[i].info};
|
||||||
|
|
||||||
lastProgram = &programs[i];
|
lastProgram = &programs[i];
|
||||||
}
|
}
|
||||||
|
@ -11,6 +11,8 @@
|
|||||||
#include <vulkan/vulkan_raii.hpp>
|
#include <vulkan/vulkan_raii.hpp>
|
||||||
#include "shader_manager.h"
|
#include "shader_manager.h"
|
||||||
|
|
||||||
|
static constexpr bool DumpShaders{false};
|
||||||
|
|
||||||
namespace Shader::Log {
|
namespace Shader::Log {
|
||||||
void Debug(const std::string &message) {
|
void Debug(const std::string &message) {
|
||||||
skyline::Logger::Write(skyline::Logger::LogLevel::Debug, message);
|
skyline::Logger::Write(skyline::Logger::LogLevel::Debug, message);
|
||||||
@ -26,7 +28,53 @@ namespace Shader::Log {
|
|||||||
}
|
}
|
||||||
|
|
||||||
namespace skyline::gpu {
|
namespace skyline::gpu {
|
||||||
ShaderManager::ShaderManager(const DeviceState &state, GPU &gpu) : gpu{gpu} {
|
void ShaderManager::LoadShaderReplacements(std::string_view replacementDir) {
|
||||||
|
std::filesystem::path replacementDirPath{replacementDir};
|
||||||
|
if (std::filesystem::exists(replacementDirPath)) {
|
||||||
|
for (const auto &entry : std::filesystem::directory_iterator{replacementDirPath}) {
|
||||||
|
if (entry.is_regular_file()) {
|
||||||
|
// Parse hash from filename
|
||||||
|
u64 hash{std::stoull(entry.path().filename().string(), nullptr, 16)};
|
||||||
|
auto it{shaderReplacements.insert({hash, {}})};
|
||||||
|
|
||||||
|
// Read file into map entry
|
||||||
|
std::ifstream file{entry.path(), std::ios::binary | std::ios::ate};
|
||||||
|
it.first->second.resize(static_cast<size_t>(file.tellg()));
|
||||||
|
file.seekg(0, std::ios::beg);
|
||||||
|
file.read(reinterpret_cast<char *>(it.first->second.data()), static_cast<std::streamsize>(it.first->second.size()));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
span<u8> ShaderManager::ProcessShaderBinary(u64 hash, span<u8> binary) {
|
||||||
|
auto it{shaderReplacements.find(hash)};
|
||||||
|
if (it != shaderReplacements.end()) {
|
||||||
|
Logger::Info("Replacing shader with hash: 0x{:X}", hash);
|
||||||
|
return it->second;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (DumpShaders) {
|
||||||
|
std::scoped_lock lock{dumpMutex};
|
||||||
|
|
||||||
|
auto shaderPath{dumpPath / fmt::format("{:016X}", hash)};
|
||||||
|
if (!std::filesystem::exists(shaderPath)) {
|
||||||
|
std::ofstream file{shaderPath, std::ios::binary};
|
||||||
|
file.write(reinterpret_cast<const char *>(binary.data()), static_cast<std::streamsize>(binary.size()));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return binary;
|
||||||
|
}
|
||||||
|
|
||||||
|
ShaderManager::ShaderManager(const DeviceState &state, GPU &gpu, std::string_view replacementDir, std::string_view dumpDir) : gpu{gpu}, dumpPath{dumpDir} {
|
||||||
|
LoadShaderReplacements(replacementDir);
|
||||||
|
|
||||||
|
if constexpr (DumpShaders) {
|
||||||
|
if (!std::filesystem::exists(dumpPath))
|
||||||
|
std::filesystem::create_directories(dumpPath);
|
||||||
|
}
|
||||||
|
|
||||||
auto &traits{gpu.traits};
|
auto &traits{gpu.traits};
|
||||||
hostTranslateInfo = Shader::HostTranslateInfo{
|
hostTranslateInfo = Shader::HostTranslateInfo{
|
||||||
.support_float16 = traits.supportsFloat16,
|
.support_float16 = traits.supportsFloat16,
|
||||||
@ -282,15 +330,25 @@ namespace skyline::gpu {
|
|||||||
return {0, 0, 0}; // Only relevant for compute shaders
|
return {0, 0, 0}; // Only relevant for compute shaders
|
||||||
}
|
}
|
||||||
|
|
||||||
|
[[nodiscard]] bool HasHLEMacroState() const final {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
[[nodiscard]] std::optional<Shader::ReplaceConstant> GetReplaceConstBuffer(u32 bank, u32 offset) final {
|
||||||
|
return std::nullopt;
|
||||||
|
}
|
||||||
|
|
||||||
void Dump(u64 hash) final {}
|
void Dump(u64 hash) final {}
|
||||||
};
|
};
|
||||||
|
|
||||||
Shader::IR::Program ShaderManager::ParseGraphicsShader(const std::array<u32, 8> &postVtgShaderAttributeSkipMask,
|
Shader::IR::Program ShaderManager::ParseGraphicsShader(const std::array<u32, 8> &postVtgShaderAttributeSkipMask,
|
||||||
Shader::Stage stage,
|
Shader::Stage stage,
|
||||||
span<u8> binary, u32 baseOffset,
|
u64 hash, span<u8> binary, u32 baseOffset,
|
||||||
u32 textureConstantBufferIndex,
|
u32 textureConstantBufferIndex,
|
||||||
bool viewportTransformEnabled,
|
bool viewportTransformEnabled,
|
||||||
const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType) {
|
const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType) {
|
||||||
|
binary = ProcessShaderBinary(hash, binary);
|
||||||
|
|
||||||
std::scoped_lock lock{poolMutex};
|
std::scoped_lock lock{poolMutex};
|
||||||
|
|
||||||
GraphicsEnvironment environment{postVtgShaderAttributeSkipMask, stage, binary, baseOffset, textureConstantBufferIndex, viewportTransformEnabled, constantBufferRead, getTextureType};
|
GraphicsEnvironment environment{postVtgShaderAttributeSkipMask, stage, binary, baseOffset, textureConstantBufferIndex, viewportTransformEnabled, constantBufferRead, getTextureType};
|
||||||
@ -311,11 +369,13 @@ namespace skyline::gpu {
|
|||||||
return Shader::Maxwell::GenerateGeometryPassthrough(instructionPool, blockPool, hostTranslateInfo, layerSource, topology);
|
return Shader::Maxwell::GenerateGeometryPassthrough(instructionPool, blockPool, hostTranslateInfo, layerSource, topology);
|
||||||
}
|
}
|
||||||
|
|
||||||
Shader::IR::Program ShaderManager::ParseComputeShader(span<u8> binary, u32 baseOffset,
|
Shader::IR::Program ShaderManager::ParseComputeShader(u64 hash, span<u8> binary, u32 baseOffset,
|
||||||
u32 textureConstantBufferIndex,
|
u32 textureConstantBufferIndex,
|
||||||
u32 localMemorySize, u32 sharedMemorySize,
|
u32 localMemorySize, u32 sharedMemorySize,
|
||||||
std::array<u32, 3> workgroupDimensions,
|
std::array<u32, 3> workgroupDimensions,
|
||||||
const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType) {
|
const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType) {
|
||||||
|
binary = ProcessShaderBinary(hash, binary);
|
||||||
|
|
||||||
std::scoped_lock lock{poolMutex};
|
std::scoped_lock lock{poolMutex};
|
||||||
|
|
||||||
ComputeEnvironment environment{binary, baseOffset, textureConstantBufferIndex, localMemorySize, sharedMemorySize, workgroupDimensions, constantBufferRead, getTextureType};
|
ComputeEnvironment environment{binary, baseOffset, textureConstantBufferIndex, localMemorySize, sharedMemorySize, workgroupDimensions, constantBufferRead, getTextureType};
|
||||||
|
@ -3,6 +3,7 @@
|
|||||||
|
|
||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
|
#include <unordered_map>
|
||||||
#include <vulkan/vulkan.hpp>
|
#include <vulkan/vulkan.hpp>
|
||||||
#include <shader_compiler/object_pool.h>
|
#include <shader_compiler/object_pool.h>
|
||||||
#include <shader_compiler/frontend/maxwell/control_flow.h>
|
#include <shader_compiler/frontend/maxwell/control_flow.h>
|
||||||
@ -27,18 +28,32 @@ namespace skyline::gpu {
|
|||||||
Shader::ObjectPool<Shader::Maxwell::Flow::Block> flowBlockPool;
|
Shader::ObjectPool<Shader::Maxwell::Flow::Block> flowBlockPool;
|
||||||
Shader::ObjectPool<Shader::IR::Inst> instructionPool;
|
Shader::ObjectPool<Shader::IR::Inst> instructionPool;
|
||||||
Shader::ObjectPool<Shader::IR::Block> blockPool;
|
Shader::ObjectPool<Shader::IR::Block> blockPool;
|
||||||
|
std::unordered_map<u64, std::vector<u8>> shaderReplacements; //!< Map of shader hash -> replacement shader binary, populated at init time and must not be modified after
|
||||||
std::mutex poolMutex;
|
std::mutex poolMutex;
|
||||||
|
std::filesystem::path dumpPath;
|
||||||
|
std::mutex dumpMutex;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Called at init time to populate the shader replacements map from the input directory
|
||||||
|
*/
|
||||||
|
void LoadShaderReplacements(std::string_view replacementDir);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @brief Returns the raw binary of shader replacement for the given hash, if no replacement is found the input binary is returned
|
||||||
|
* @note This will also dump the binary to disk if dumping is enabled
|
||||||
|
*/
|
||||||
|
span<u8> ProcessShaderBinary(u64 hash, span<u8> binary);
|
||||||
|
|
||||||
public:
|
public:
|
||||||
using ConstantBufferRead = std::function<u32(u32 index, u32 offset)>; //!< A function which reads a constant buffer at the specified offset and returns the value
|
using ConstantBufferRead = std::function<u32(u32 index, u32 offset)>; //!< A function which reads a constant buffer at the specified offset and returns the value
|
||||||
using GetTextureType = std::function<Shader::TextureType(u32 handle)>; //!< A function which determines the type of a texture from its handle by checking the corresponding TIC
|
using GetTextureType = std::function<Shader::TextureType(u32 handle)>; //!< A function which determines the type of a texture from its handle by checking the corresponding TIC
|
||||||
|
|
||||||
ShaderManager(const DeviceState &state, GPU &gpu);
|
ShaderManager(const DeviceState &state, GPU &gpu, std::string_view replacementDir, std::string_view dumpDir);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* @return A shader program that corresponds to all the supplied state including the current state of the constant buffers
|
* @return A shader program that corresponds to all the supplied state including the current state of the constant buffers
|
||||||
*/
|
*/
|
||||||
Shader::IR::Program ParseGraphicsShader(const std::array<u32, 8> &postVtgShaderAttributeSkipMask, Shader::Stage stage, span<u8> binary, u32 baseOffset, u32 textureConstantBufferIndex, bool viewportTransformEnabled, const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType);
|
Shader::IR::Program ParseGraphicsShader(const std::array<u32, 8> &postVtgShaderAttributeSkipMask, Shader::Stage stage, u64 hash, span<u8> binary, u32 baseOffset, u32 textureConstantBufferIndex, bool viewportTransformEnabled, const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* @brief Combines the VertexA and VertexB shader programs into a single program
|
* @brief Combines the VertexA and VertexB shader programs into a single program
|
||||||
@ -51,7 +66,7 @@ namespace skyline::gpu {
|
|||||||
*/
|
*/
|
||||||
Shader::IR::Program GenerateGeometryPassthroughShader(Shader::IR::Program &layerSource, Shader::OutputTopology topology);
|
Shader::IR::Program GenerateGeometryPassthroughShader(Shader::IR::Program &layerSource, Shader::OutputTopology topology);
|
||||||
|
|
||||||
Shader::IR::Program ParseComputeShader(span<u8> binary, u32 baseOffset, u32 textureConstantBufferIndex, u32 localMemorySize, u32 sharedMemorySize, std::array<u32, 3> workgroupDimensions, const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType);
|
Shader::IR::Program ParseComputeShader(u64 hash, span<u8> binary, u32 baseOffset, u32 textureConstantBufferIndex, u32 localMemorySize, u32 sharedMemorySize, std::array<u32, 3> workgroupDimensions, const ConstantBufferRead &constantBufferRead, const GetTextureType &getTextureType);
|
||||||
|
|
||||||
vk::ShaderModule CompileShader(const Shader::RuntimeInfo &runtimeInfo, Shader::IR::Program &program, Shader::Backend::Bindings &bindings);
|
vk::ShaderModule CompileShader(const Shader::RuntimeInfo &runtimeInfo, Shader::IR::Program &program, Shader::Backend::Bindings &bindings);
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user