mirror of
https://gitlab.com/suyu-emu/suyu.git
synced 2024-03-15 23:15:44 +00:00
shader: Implement D3D samplers
This commit is contained in:
parent
a8d46a5eae
commit
dd860b684c
|
@ -17,7 +17,7 @@ public:
|
||||||
|
|
||||||
[[nodiscard]] virtual u32 ReadCbufValue(u32 cbuf_index, u32 cbuf_offset) = 0;
|
[[nodiscard]] virtual u32 ReadCbufValue(u32 cbuf_index, u32 cbuf_offset) = 0;
|
||||||
|
|
||||||
[[nodiscard]] virtual TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) = 0;
|
[[nodiscard]] virtual TextureType ReadTextureType(u32 raw_handle) = 0;
|
||||||
|
|
||||||
[[nodiscard]] virtual u32 TextureBoundBuffer() const = 0;
|
[[nodiscard]] virtual u32 TextureBoundBuffer() const = 0;
|
||||||
|
|
||||||
|
|
|
@ -19,6 +19,9 @@ namespace {
|
||||||
struct ConstBufferAddr {
|
struct ConstBufferAddr {
|
||||||
u32 index;
|
u32 index;
|
||||||
u32 offset;
|
u32 offset;
|
||||||
|
u32 secondary_index;
|
||||||
|
u32 secondary_offset;
|
||||||
|
bool has_secondary;
|
||||||
};
|
};
|
||||||
|
|
||||||
struct TextureInst {
|
struct TextureInst {
|
||||||
|
@ -109,9 +112,38 @@ bool IsTextureInstruction(const IR::Inst& inst) {
|
||||||
return IndexedInstruction(inst) != IR::Opcode::Void;
|
return IndexedInstruction(inst) != IR::Opcode::Void;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
std::optional<ConstBufferAddr> TryGetConstBuffer(const IR::Inst* inst);
|
||||||
|
|
||||||
|
std::optional<ConstBufferAddr> Track(const IR::Value& value) {
|
||||||
|
return IR::BreadthFirstSearch(value, TryGetConstBuffer);
|
||||||
|
}
|
||||||
|
|
||||||
std::optional<ConstBufferAddr> TryGetConstBuffer(const IR::Inst* inst) {
|
std::optional<ConstBufferAddr> TryGetConstBuffer(const IR::Inst* inst) {
|
||||||
if (inst->GetOpcode() != IR::Opcode::GetCbufU32) {
|
switch (inst->GetOpcode()) {
|
||||||
|
default:
|
||||||
return std::nullopt;
|
return std::nullopt;
|
||||||
|
case IR::Opcode::BitwiseOr32: {
|
||||||
|
std::optional lhs{Track(inst->Arg(0))};
|
||||||
|
std::optional rhs{Track(inst->Arg(1))};
|
||||||
|
if (!lhs || !rhs) {
|
||||||
|
return std::nullopt;
|
||||||
|
}
|
||||||
|
if (lhs->has_secondary || rhs->has_secondary) {
|
||||||
|
return std::nullopt;
|
||||||
|
}
|
||||||
|
if (lhs->index > rhs->index || lhs->offset > rhs->offset) {
|
||||||
|
std::swap(lhs, rhs);
|
||||||
|
}
|
||||||
|
return ConstBufferAddr{
|
||||||
|
.index = lhs->index,
|
||||||
|
.offset = lhs->offset,
|
||||||
|
.secondary_index = rhs->index,
|
||||||
|
.secondary_offset = rhs->offset,
|
||||||
|
.has_secondary = true,
|
||||||
|
};
|
||||||
|
}
|
||||||
|
case IR::Opcode::GetCbufU32:
|
||||||
|
break;
|
||||||
}
|
}
|
||||||
const IR::Value index{inst->Arg(0)};
|
const IR::Value index{inst->Arg(0)};
|
||||||
const IR::Value offset{inst->Arg(1)};
|
const IR::Value offset{inst->Arg(1)};
|
||||||
|
@ -127,13 +159,12 @@ std::optional<ConstBufferAddr> TryGetConstBuffer(const IR::Inst* inst) {
|
||||||
return ConstBufferAddr{
|
return ConstBufferAddr{
|
||||||
.index{index.U32()},
|
.index{index.U32()},
|
||||||
.offset{offset.U32()},
|
.offset{offset.U32()},
|
||||||
|
.secondary_index = 0,
|
||||||
|
.secondary_offset = 0,
|
||||||
|
.has_secondary = false,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
std::optional<ConstBufferAddr> Track(const IR::Value& value) {
|
|
||||||
return IR::BreadthFirstSearch(value, TryGetConstBuffer);
|
|
||||||
}
|
|
||||||
|
|
||||||
TextureInst MakeInst(Environment& env, IR::Block* block, IR::Inst& inst) {
|
TextureInst MakeInst(Environment& env, IR::Block* block, IR::Inst& inst) {
|
||||||
ConstBufferAddr addr;
|
ConstBufferAddr addr;
|
||||||
if (IsBindless(inst)) {
|
if (IsBindless(inst)) {
|
||||||
|
@ -146,6 +177,9 @@ TextureInst MakeInst(Environment& env, IR::Block* block, IR::Inst& inst) {
|
||||||
addr = ConstBufferAddr{
|
addr = ConstBufferAddr{
|
||||||
.index = env.TextureBoundBuffer(),
|
.index = env.TextureBoundBuffer(),
|
||||||
.offset = inst.Arg(0).U32(),
|
.offset = inst.Arg(0).U32(),
|
||||||
|
.secondary_index = 0,
|
||||||
|
.secondary_offset = 0,
|
||||||
|
.has_secondary = false,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
return TextureInst{
|
return TextureInst{
|
||||||
|
@ -155,6 +189,14 @@ TextureInst MakeInst(Environment& env, IR::Block* block, IR::Inst& inst) {
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
TextureType ReadTextureType(Environment& env, const ConstBufferAddr& cbuf) {
|
||||||
|
const u32 secondary_index{cbuf.has_secondary ? cbuf.index : cbuf.secondary_index};
|
||||||
|
const u32 secondary_offset{cbuf.has_secondary ? cbuf.offset : cbuf.secondary_offset};
|
||||||
|
const u32 lhs_raw{env.ReadCbufValue(cbuf.index, cbuf.offset)};
|
||||||
|
const u32 rhs_raw{env.ReadCbufValue(secondary_index, secondary_offset)};
|
||||||
|
return env.ReadTextureType(lhs_raw | rhs_raw);
|
||||||
|
}
|
||||||
|
|
||||||
class Descriptors {
|
class Descriptors {
|
||||||
public:
|
public:
|
||||||
explicit Descriptors(TextureBufferDescriptors& texture_buffer_descriptors_,
|
explicit Descriptors(TextureBufferDescriptors& texture_buffer_descriptors_,
|
||||||
|
@ -167,8 +209,11 @@ public:
|
||||||
|
|
||||||
u32 Add(const TextureBufferDescriptor& desc) {
|
u32 Add(const TextureBufferDescriptor& desc) {
|
||||||
return Add(texture_buffer_descriptors, desc, [&desc](const auto& existing) {
|
return Add(texture_buffer_descriptors, desc, [&desc](const auto& existing) {
|
||||||
return desc.cbuf_index == existing.cbuf_index &&
|
return desc.has_secondary == existing.has_secondary &&
|
||||||
desc.cbuf_offset == existing.cbuf_offset;
|
desc.cbuf_index == existing.cbuf_index &&
|
||||||
|
desc.cbuf_offset == existing.cbuf_offset &&
|
||||||
|
desc.secondary_cbuf_index == existing.secondary_cbuf_index &&
|
||||||
|
desc.secondary_cbuf_offset == existing.secondary_cbuf_offset;
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -181,8 +226,12 @@ public:
|
||||||
|
|
||||||
u32 Add(const TextureDescriptor& desc) {
|
u32 Add(const TextureDescriptor& desc) {
|
||||||
return Add(texture_descriptors, desc, [&desc](const auto& existing) {
|
return Add(texture_descriptors, desc, [&desc](const auto& existing) {
|
||||||
return desc.cbuf_index == existing.cbuf_index &&
|
return desc.type == existing.type && desc.is_depth == existing.is_depth &&
|
||||||
desc.cbuf_offset == existing.cbuf_offset && desc.type == existing.type;
|
desc.has_secondary == existing.has_secondary &&
|
||||||
|
desc.cbuf_index == existing.cbuf_index &&
|
||||||
|
desc.cbuf_offset == existing.cbuf_offset &&
|
||||||
|
desc.secondary_cbuf_index == existing.secondary_cbuf_index &&
|
||||||
|
desc.secondary_cbuf_offset == existing.secondary_cbuf_offset;
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -247,14 +296,14 @@ void TexturePass(Environment& env, IR::Program& program) {
|
||||||
auto flags{inst->Flags<IR::TextureInstInfo>()};
|
auto flags{inst->Flags<IR::TextureInstInfo>()};
|
||||||
switch (inst->GetOpcode()) {
|
switch (inst->GetOpcode()) {
|
||||||
case IR::Opcode::ImageQueryDimensions:
|
case IR::Opcode::ImageQueryDimensions:
|
||||||
flags.type.Assign(env.ReadTextureType(cbuf.index, cbuf.offset));
|
flags.type.Assign(ReadTextureType(env, cbuf));
|
||||||
inst->SetFlags(flags);
|
inst->SetFlags(flags);
|
||||||
break;
|
break;
|
||||||
case IR::Opcode::ImageFetch:
|
case IR::Opcode::ImageFetch:
|
||||||
if (flags.type != TextureType::Color1D) {
|
if (flags.type != TextureType::Color1D) {
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
if (env.ReadTextureType(cbuf.index, cbuf.offset) == TextureType::Buffer) {
|
if (ReadTextureType(env, cbuf) == TextureType::Buffer) {
|
||||||
// Replace with the bound texture type only when it's a texture buffer
|
// Replace with the bound texture type only when it's a texture buffer
|
||||||
// If the instruction is 1D and the bound type is 2D, don't change the code and let
|
// If the instruction is 1D and the bound type is 2D, don't change the code and let
|
||||||
// the rasterizer robustness handle it
|
// the rasterizer robustness handle it
|
||||||
|
@ -270,6 +319,9 @@ void TexturePass(Environment& env, IR::Program& program) {
|
||||||
switch (inst->GetOpcode()) {
|
switch (inst->GetOpcode()) {
|
||||||
case IR::Opcode::ImageRead:
|
case IR::Opcode::ImageRead:
|
||||||
case IR::Opcode::ImageWrite: {
|
case IR::Opcode::ImageWrite: {
|
||||||
|
if (cbuf.has_secondary) {
|
||||||
|
throw NotImplementedException("Unexpected separate sampler");
|
||||||
|
}
|
||||||
const bool is_written{inst->GetOpcode() == IR::Opcode::ImageWrite};
|
const bool is_written{inst->GetOpcode() == IR::Opcode::ImageWrite};
|
||||||
if (flags.type == TextureType::Buffer) {
|
if (flags.type == TextureType::Buffer) {
|
||||||
index = descriptors.Add(ImageBufferDescriptor{
|
index = descriptors.Add(ImageBufferDescriptor{
|
||||||
|
@ -294,16 +346,22 @@ void TexturePass(Environment& env, IR::Program& program) {
|
||||||
default:
|
default:
|
||||||
if (flags.type == TextureType::Buffer) {
|
if (flags.type == TextureType::Buffer) {
|
||||||
index = descriptors.Add(TextureBufferDescriptor{
|
index = descriptors.Add(TextureBufferDescriptor{
|
||||||
|
.has_secondary = cbuf.has_secondary,
|
||||||
.cbuf_index = cbuf.index,
|
.cbuf_index = cbuf.index,
|
||||||
.cbuf_offset = cbuf.offset,
|
.cbuf_offset = cbuf.offset,
|
||||||
|
.secondary_cbuf_index = cbuf.secondary_index,
|
||||||
|
.secondary_cbuf_offset = cbuf.secondary_offset,
|
||||||
.count = 1,
|
.count = 1,
|
||||||
});
|
});
|
||||||
} else {
|
} else {
|
||||||
index = descriptors.Add(TextureDescriptor{
|
index = descriptors.Add(TextureDescriptor{
|
||||||
.type = flags.type,
|
.type = flags.type,
|
||||||
.is_depth = flags.is_depth != 0,
|
.is_depth = flags.is_depth != 0,
|
||||||
|
.has_secondary = cbuf.has_secondary,
|
||||||
.cbuf_index = cbuf.index,
|
.cbuf_index = cbuf.index,
|
||||||
.cbuf_offset = cbuf.offset,
|
.cbuf_offset = cbuf.offset,
|
||||||
|
.secondary_cbuf_index = cbuf.secondary_index,
|
||||||
|
.secondary_cbuf_offset = cbuf.secondary_offset,
|
||||||
.count = 1,
|
.count = 1,
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
|
@ -61,8 +61,11 @@ struct StorageBufferDescriptor {
|
||||||
};
|
};
|
||||||
|
|
||||||
struct TextureBufferDescriptor {
|
struct TextureBufferDescriptor {
|
||||||
|
bool has_secondary;
|
||||||
u32 cbuf_index;
|
u32 cbuf_index;
|
||||||
u32 cbuf_offset;
|
u32 cbuf_offset;
|
||||||
|
u32 secondary_cbuf_index;
|
||||||
|
u32 secondary_cbuf_offset;
|
||||||
u32 count;
|
u32 count;
|
||||||
};
|
};
|
||||||
using TextureBufferDescriptors = boost::container::small_vector<TextureBufferDescriptor, 6>;
|
using TextureBufferDescriptors = boost::container::small_vector<TextureBufferDescriptor, 6>;
|
||||||
|
@ -79,8 +82,11 @@ using ImageBufferDescriptors = boost::container::small_vector<ImageBufferDescrip
|
||||||
struct TextureDescriptor {
|
struct TextureDescriptor {
|
||||||
TextureType type;
|
TextureType type;
|
||||||
bool is_depth;
|
bool is_depth;
|
||||||
|
bool has_secondary;
|
||||||
u32 cbuf_index;
|
u32 cbuf_index;
|
||||||
u32 cbuf_offset;
|
u32 cbuf_offset;
|
||||||
|
u32 secondary_cbuf_index;
|
||||||
|
u32 secondary_cbuf_offset;
|
||||||
u32 count;
|
u32 count;
|
||||||
};
|
};
|
||||||
using TextureDescriptors = boost::container::small_vector<TextureDescriptor, 12>;
|
using TextureDescriptors = boost::container::small_vector<TextureDescriptor, 12>;
|
||||||
|
|
|
@ -88,23 +88,34 @@ void ComputePipeline::Configure(Tegra::Engines::KeplerCompute& kepler_compute,
|
||||||
boost::container::static_vector<u32, max_elements> image_view_indices;
|
boost::container::static_vector<u32, max_elements> image_view_indices;
|
||||||
boost::container::static_vector<VkSampler, max_elements> samplers;
|
boost::container::static_vector<VkSampler, max_elements> samplers;
|
||||||
|
|
||||||
const auto& launch_desc{kepler_compute.launch_description};
|
const auto& qmd{kepler_compute.launch_description};
|
||||||
const auto& cbufs{launch_desc.const_buffer_config};
|
const auto& cbufs{qmd.const_buffer_config};
|
||||||
const bool via_header_index{launch_desc.linked_tsc};
|
const bool via_header_index{qmd.linked_tsc != 0};
|
||||||
const auto read_handle{[&](u32 cbuf_index, u32 cbuf_offset) {
|
const auto read_handle{[&](const auto& desc) {
|
||||||
ASSERT(((launch_desc.const_buffer_enable_mask >> cbuf_index) & 1) != 0);
|
ASSERT(((qmd.const_buffer_enable_mask >> desc.cbuf_index) & 1) != 0);
|
||||||
const GPUVAddr addr{cbufs[cbuf_index].Address() + cbuf_offset};
|
const GPUVAddr addr{cbufs[desc.cbuf_index].Address() + desc.cbuf_offset};
|
||||||
const u32 raw_handle{gpu_memory.Read<u32>(addr)};
|
if constexpr (std::is_same_v<decltype(desc), const Shader::TextureDescriptor&> ||
|
||||||
return TextureHandle(raw_handle, via_header_index);
|
std::is_same_v<decltype(desc), const Shader::TextureBufferDescriptor&>) {
|
||||||
|
if (desc.has_secondary) {
|
||||||
|
ASSERT(((qmd.const_buffer_enable_mask >> desc.secondary_cbuf_index) & 1) != 0);
|
||||||
|
const GPUVAddr separate_addr{cbufs[desc.secondary_cbuf_index].Address() +
|
||||||
|
desc.secondary_cbuf_offset};
|
||||||
|
const u32 lhs_raw{gpu_memory.Read<u32>(addr)};
|
||||||
|
const u32 rhs_raw{gpu_memory.Read<u32>(separate_addr)};
|
||||||
|
const u32 raw{lhs_raw | rhs_raw};
|
||||||
|
return TextureHandle{raw, via_header_index};
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return TextureHandle{gpu_memory.Read<u32>(addr), via_header_index};
|
||||||
}};
|
}};
|
||||||
const auto add_image{[&](const auto& desc) {
|
const auto add_image{[&](const auto& desc) {
|
||||||
const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
|
const TextureHandle handle{read_handle(desc)};
|
||||||
image_view_indices.push_back(handle.image);
|
image_view_indices.push_back(handle.image);
|
||||||
}};
|
}};
|
||||||
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
|
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
|
||||||
std::ranges::for_each(info.image_buffer_descriptors, add_image);
|
std::ranges::for_each(info.image_buffer_descriptors, add_image);
|
||||||
for (const auto& desc : info.texture_descriptors) {
|
for (const auto& desc : info.texture_descriptors) {
|
||||||
const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
|
const TextureHandle handle{read_handle(desc)};
|
||||||
image_view_indices.push_back(handle.image);
|
image_view_indices.push_back(handle.image);
|
||||||
|
|
||||||
Sampler* const sampler = texture_cache.GetComputeSampler(handle.sampler);
|
Sampler* const sampler = texture_cache.GetComputeSampler(handle.sampler);
|
||||||
|
|
|
@ -169,20 +169,31 @@ void GraphicsPipeline::Configure(bool is_indexed) {
|
||||||
++index;
|
++index;
|
||||||
}
|
}
|
||||||
const auto& cbufs{maxwell3d.state.shader_stages[stage].const_buffers};
|
const auto& cbufs{maxwell3d.state.shader_stages[stage].const_buffers};
|
||||||
const auto read_handle{[&](u32 cbuf_index, u32 cbuf_offset) {
|
const auto read_handle{[&](const auto& desc) {
|
||||||
ASSERT(cbufs[cbuf_index].enabled);
|
ASSERT(cbufs[desc.cbuf_index].enabled);
|
||||||
const GPUVAddr addr{cbufs[cbuf_index].address + cbuf_offset};
|
const GPUVAddr addr{cbufs[desc.cbuf_index].address + desc.cbuf_offset};
|
||||||
const u32 raw_handle{gpu_memory.Read<u32>(addr)};
|
if constexpr (std::is_same_v<decltype(desc), const Shader::TextureDescriptor&> ||
|
||||||
return TextureHandle(raw_handle, via_header_index);
|
std::is_same_v<decltype(desc), const Shader::TextureBufferDescriptor&>) {
|
||||||
|
if (desc.has_secondary) {
|
||||||
|
ASSERT(cbufs[desc.secondary_cbuf_index].enabled);
|
||||||
|
const GPUVAddr separate_addr{cbufs[desc.secondary_cbuf_index].address +
|
||||||
|
desc.secondary_cbuf_offset};
|
||||||
|
const u32 lhs_raw{gpu_memory.Read<u32>(addr)};
|
||||||
|
const u32 rhs_raw{gpu_memory.Read<u32>(separate_addr)};
|
||||||
|
const u32 raw{lhs_raw | rhs_raw};
|
||||||
|
return TextureHandle{raw, via_header_index};
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return TextureHandle{gpu_memory.Read<u32>(addr), via_header_index};
|
||||||
}};
|
}};
|
||||||
const auto add_image{[&](const auto& desc) {
|
const auto add_image{[&](const auto& desc) {
|
||||||
const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
|
const TextureHandle handle{read_handle(desc)};
|
||||||
image_view_indices.push_back(handle.image);
|
image_view_indices.push_back(handle.image);
|
||||||
}};
|
}};
|
||||||
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
|
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
|
||||||
std::ranges::for_each(info.image_buffer_descriptors, add_image);
|
std::ranges::for_each(info.image_buffer_descriptors, add_image);
|
||||||
for (const auto& desc : info.texture_descriptors) {
|
for (const auto& desc : info.texture_descriptors) {
|
||||||
const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
|
const TextureHandle handle{read_handle(desc)};
|
||||||
image_view_indices.push_back(handle.image);
|
image_view_indices.push_back(handle.image);
|
||||||
|
|
||||||
Sampler* const sampler{texture_cache.GetGraphicsSampler(handle.sampler)};
|
Sampler* const sampler{texture_cache.GetGraphicsSampler(handle.sampler)};
|
||||||
|
|
|
@ -188,9 +188,7 @@ protected:
|
||||||
}
|
}
|
||||||
|
|
||||||
Shader::TextureType ReadTextureTypeImpl(GPUVAddr tic_addr, u32 tic_limit, bool via_header_index,
|
Shader::TextureType ReadTextureTypeImpl(GPUVAddr tic_addr, u32 tic_limit, bool via_header_index,
|
||||||
GPUVAddr cbuf_addr, u32 cbuf_size, u32 cbuf_index,
|
u32 raw) {
|
||||||
u32 cbuf_offset) {
|
|
||||||
const u32 raw{cbuf_offset < cbuf_size ? gpu_memory->Read<u32>(cbuf_addr + cbuf_offset) : 0};
|
|
||||||
const TextureHandle handle{raw, via_header_index};
|
const TextureHandle handle{raw, via_header_index};
|
||||||
const GPUVAddr descriptor_addr{tic_addr + handle.image * sizeof(Tegra::Texture::TICEntry)};
|
const GPUVAddr descriptor_addr{tic_addr + handle.image * sizeof(Tegra::Texture::TICEntry)};
|
||||||
Tegra::Texture::TICEntry entry;
|
Tegra::Texture::TICEntry entry;
|
||||||
|
@ -219,7 +217,7 @@ protected:
|
||||||
throw Shader::NotImplementedException("Unknown texture type");
|
throw Shader::NotImplementedException("Unknown texture type");
|
||||||
}
|
}
|
||||||
}()};
|
}()};
|
||||||
texture_types.emplace(MakeCbufKey(cbuf_index, cbuf_offset), result);
|
texture_types.emplace(raw, result);
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -227,7 +225,7 @@ protected:
|
||||||
GPUVAddr program_base{};
|
GPUVAddr program_base{};
|
||||||
|
|
||||||
std::vector<u64> code;
|
std::vector<u64> code;
|
||||||
std::unordered_map<u64, Shader::TextureType> texture_types;
|
std::unordered_map<u32, Shader::TextureType> texture_types;
|
||||||
std::unordered_map<u64, u32> cbuf_values;
|
std::unordered_map<u64, u32> cbuf_values;
|
||||||
|
|
||||||
u32 local_memory_size{};
|
u32 local_memory_size{};
|
||||||
|
@ -250,7 +248,7 @@ using Shader::Maxwell::TranslateProgram;
|
||||||
|
|
||||||
// TODO: Move this to a separate file
|
// TODO: Move this to a separate file
|
||||||
constexpr std::array<char, 8> MAGIC_NUMBER{'y', 'u', 'z', 'u', 'c', 'a', 'c', 'h'};
|
constexpr std::array<char, 8> MAGIC_NUMBER{'y', 'u', 'z', 'u', 'c', 'a', 'c', 'h'};
|
||||||
constexpr u32 CACHE_VERSION{1};
|
constexpr u32 CACHE_VERSION{2};
|
||||||
|
|
||||||
class GraphicsEnvironment final : public GenericEnvironment {
|
class GraphicsEnvironment final : public GenericEnvironment {
|
||||||
public:
|
public:
|
||||||
|
@ -308,13 +306,10 @@ public:
|
||||||
return value;
|
return value;
|
||||||
}
|
}
|
||||||
|
|
||||||
Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
|
Shader::TextureType ReadTextureType(u32 handle) override {
|
||||||
const auto& regs{maxwell3d->regs};
|
const auto& regs{maxwell3d->regs};
|
||||||
const auto& cbuf{maxwell3d->state.shader_stages[stage_index].const_buffers[cbuf_index]};
|
|
||||||
ASSERT(cbuf.enabled);
|
|
||||||
const bool via_header_index{regs.sampler_index == Maxwell::SamplerIndex::ViaHeaderIndex};
|
const bool via_header_index{regs.sampler_index == Maxwell::SamplerIndex::ViaHeaderIndex};
|
||||||
return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, via_header_index,
|
return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, via_header_index, handle);
|
||||||
cbuf.address, cbuf.size, cbuf_index, cbuf_offset);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
private:
|
private:
|
||||||
|
@ -352,13 +347,10 @@ public:
|
||||||
return value;
|
return value;
|
||||||
}
|
}
|
||||||
|
|
||||||
Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
|
Shader::TextureType ReadTextureType(u32 handle) override {
|
||||||
const auto& regs{kepler_compute->regs};
|
const auto& regs{kepler_compute->regs};
|
||||||
const auto& qmd{kepler_compute->launch_description};
|
const auto& qmd{kepler_compute->launch_description};
|
||||||
ASSERT(((qmd.const_buffer_enable_mask.Value() >> cbuf_index) & 1) != 0);
|
return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, qmd.linked_tsc != 0, handle);
|
||||||
const auto& cbuf{qmd.const_buffer_config[cbuf_index]};
|
|
||||||
return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, qmd.linked_tsc != 0,
|
|
||||||
cbuf.Address(), cbuf.size, cbuf_index, cbuf_offset);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
private:
|
private:
|
||||||
|
@ -421,7 +413,7 @@ public:
|
||||||
code = std::make_unique<u64[]>(Common::DivCeil(code_size, sizeof(u64)));
|
code = std::make_unique<u64[]>(Common::DivCeil(code_size, sizeof(u64)));
|
||||||
file.read(reinterpret_cast<char*>(code.get()), code_size);
|
file.read(reinterpret_cast<char*>(code.get()), code_size);
|
||||||
for (size_t i = 0; i < num_texture_types; ++i) {
|
for (size_t i = 0; i < num_texture_types; ++i) {
|
||||||
u64 key;
|
u32 key;
|
||||||
Shader::TextureType type;
|
Shader::TextureType type;
|
||||||
file.read(reinterpret_cast<char*>(&key), sizeof(key))
|
file.read(reinterpret_cast<char*>(&key), sizeof(key))
|
||||||
.read(reinterpret_cast<char*>(&type), sizeof(type));
|
.read(reinterpret_cast<char*>(&type), sizeof(type));
|
||||||
|
@ -457,8 +449,8 @@ public:
|
||||||
return it->second;
|
return it->second;
|
||||||
}
|
}
|
||||||
|
|
||||||
Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
|
Shader::TextureType ReadTextureType(u32 handle) override {
|
||||||
const auto it{texture_types.find(MakeCbufKey(cbuf_index, cbuf_offset))};
|
const auto it{texture_types.find(handle)};
|
||||||
if (it == texture_types.end()) {
|
if (it == texture_types.end()) {
|
||||||
throw Shader::LogicError("Uncached read texture type");
|
throw Shader::LogicError("Uncached read texture type");
|
||||||
}
|
}
|
||||||
|
@ -483,7 +475,7 @@ public:
|
||||||
|
|
||||||
private:
|
private:
|
||||||
std::unique_ptr<u64[]> code;
|
std::unique_ptr<u64[]> code;
|
||||||
std::unordered_map<u64, Shader::TextureType> texture_types;
|
std::unordered_map<u32, Shader::TextureType> texture_types;
|
||||||
std::unordered_map<u64, u32> cbuf_values;
|
std::unordered_map<u64, u32> cbuf_values;
|
||||||
std::array<u32, 3> workgroup_size{};
|
std::array<u32, 3> workgroup_size{};
|
||||||
u32 local_memory_size{};
|
u32 local_memory_size{};
|
||||||
|
|
Loading…
Reference in a new issue