summaryrefslogtreecommitdiffstats
path: root/src/video_core
diff options
context:
space:
mode:
authorReinUsesLisp <reinuseslisp@airmail.cc>2021-04-21 00:48:45 +0200
committerameerj <52414509+ameerj@users.noreply.github.com>2021-07-23 03:51:28 +0200
commitdd860b684c7695097107c1186e96a70e754e5990 (patch)
tree14cbd25c655798f846b75582d5364aef0508f8b0 /src/video_core
parentshader: Add constant propagation for arithmetic right shifts (diff)
downloadyuzu-dd860b684c7695097107c1186e96a70e754e5990.tar
yuzu-dd860b684c7695097107c1186e96a70e754e5990.tar.gz
yuzu-dd860b684c7695097107c1186e96a70e754e5990.tar.bz2
yuzu-dd860b684c7695097107c1186e96a70e754e5990.tar.lz
yuzu-dd860b684c7695097107c1186e96a70e754e5990.tar.xz
yuzu-dd860b684c7695097107c1186e96a70e754e5990.tar.zst
yuzu-dd860b684c7695097107c1186e96a70e754e5990.zip
Diffstat (limited to 'src/video_core')
-rw-r--r--src/video_core/renderer_vulkan/vk_compute_pipeline.cpp31
-rw-r--r--src/video_core/renderer_vulkan/vk_graphics_pipeline.cpp25
-rw-r--r--src/video_core/renderer_vulkan/vk_pipeline_cache.cpp32
3 files changed, 51 insertions, 37 deletions
diff --git a/src/video_core/renderer_vulkan/vk_compute_pipeline.cpp b/src/video_core/renderer_vulkan/vk_compute_pipeline.cpp
index 3c907ec5a..45d837ca4 100644
--- a/src/video_core/renderer_vulkan/vk_compute_pipeline.cpp
+++ b/src/video_core/renderer_vulkan/vk_compute_pipeline.cpp
@@ -88,23 +88,34 @@ void ComputePipeline::Configure(Tegra::Engines::KeplerCompute& kepler_compute,
boost::container::static_vector<u32, max_elements> image_view_indices;
boost::container::static_vector<VkSampler, max_elements> samplers;
- const auto& launch_desc{kepler_compute.launch_description};
- const auto& cbufs{launch_desc.const_buffer_config};
- const bool via_header_index{launch_desc.linked_tsc};
- const auto read_handle{[&](u32 cbuf_index, u32 cbuf_offset) {
- ASSERT(((launch_desc.const_buffer_enable_mask >> cbuf_index) & 1) != 0);
- const GPUVAddr addr{cbufs[cbuf_index].Address() + cbuf_offset};
- const u32 raw_handle{gpu_memory.Read<u32>(addr)};
- return TextureHandle(raw_handle, via_header_index);
+ const auto& qmd{kepler_compute.launch_description};
+ const auto& cbufs{qmd.const_buffer_config};
+ const bool via_header_index{qmd.linked_tsc != 0};
+ const auto read_handle{[&](const auto& desc) {
+ ASSERT(((qmd.const_buffer_enable_mask >> desc.cbuf_index) & 1) != 0);
+ const GPUVAddr addr{cbufs[desc.cbuf_index].Address() + desc.cbuf_offset};
+ if constexpr (std::is_same_v<decltype(desc), const Shader::TextureDescriptor&> ||
+ std::is_same_v<decltype(desc), const Shader::TextureBufferDescriptor&>) {
+ if (desc.has_secondary) {
+ ASSERT(((qmd.const_buffer_enable_mask >> desc.secondary_cbuf_index) & 1) != 0);
+ const GPUVAddr separate_addr{cbufs[desc.secondary_cbuf_index].Address() +
+ desc.secondary_cbuf_offset};
+ const u32 lhs_raw{gpu_memory.Read<u32>(addr)};
+ const u32 rhs_raw{gpu_memory.Read<u32>(separate_addr)};
+ const u32 raw{lhs_raw | rhs_raw};
+ return TextureHandle{raw, via_header_index};
+ }
+ }
+ return TextureHandle{gpu_memory.Read<u32>(addr), via_header_index};
}};
const auto add_image{[&](const auto& desc) {
- const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
+ const TextureHandle handle{read_handle(desc)};
image_view_indices.push_back(handle.image);
}};
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
std::ranges::for_each(info.image_buffer_descriptors, add_image);
for (const auto& desc : info.texture_descriptors) {
- const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
+ const TextureHandle handle{read_handle(desc)};
image_view_indices.push_back(handle.image);
Sampler* const sampler = texture_cache.GetComputeSampler(handle.sampler);
diff --git a/src/video_core/renderer_vulkan/vk_graphics_pipeline.cpp b/src/video_core/renderer_vulkan/vk_graphics_pipeline.cpp
index d5e9dae0f..08f00b9ce 100644
--- a/src/video_core/renderer_vulkan/vk_graphics_pipeline.cpp
+++ b/src/video_core/renderer_vulkan/vk_graphics_pipeline.cpp
@@ -169,20 +169,31 @@ void GraphicsPipeline::Configure(bool is_indexed) {
++index;
}
const auto& cbufs{maxwell3d.state.shader_stages[stage].const_buffers};
- const auto read_handle{[&](u32 cbuf_index, u32 cbuf_offset) {
- ASSERT(cbufs[cbuf_index].enabled);
- const GPUVAddr addr{cbufs[cbuf_index].address + cbuf_offset};
- const u32 raw_handle{gpu_memory.Read<u32>(addr)};
- return TextureHandle(raw_handle, via_header_index);
+ const auto read_handle{[&](const auto& desc) {
+ ASSERT(cbufs[desc.cbuf_index].enabled);
+ const GPUVAddr addr{cbufs[desc.cbuf_index].address + desc.cbuf_offset};
+ if constexpr (std::is_same_v<decltype(desc), const Shader::TextureDescriptor&> ||
+ std::is_same_v<decltype(desc), const Shader::TextureBufferDescriptor&>) {
+ if (desc.has_secondary) {
+ ASSERT(cbufs[desc.secondary_cbuf_index].enabled);
+ const GPUVAddr separate_addr{cbufs[desc.secondary_cbuf_index].address +
+ desc.secondary_cbuf_offset};
+ const u32 lhs_raw{gpu_memory.Read<u32>(addr)};
+ const u32 rhs_raw{gpu_memory.Read<u32>(separate_addr)};
+ const u32 raw{lhs_raw | rhs_raw};
+ return TextureHandle{raw, via_header_index};
+ }
+ }
+ return TextureHandle{gpu_memory.Read<u32>(addr), via_header_index};
}};
const auto add_image{[&](const auto& desc) {
- const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
+ const TextureHandle handle{read_handle(desc)};
image_view_indices.push_back(handle.image);
}};
std::ranges::for_each(info.texture_buffer_descriptors, add_image);
std::ranges::for_each(info.image_buffer_descriptors, add_image);
for (const auto& desc : info.texture_descriptors) {
- const TextureHandle handle{read_handle(desc.cbuf_index, desc.cbuf_offset)};
+ const TextureHandle handle{read_handle(desc)};
image_view_indices.push_back(handle.image);
Sampler* const sampler{texture_cache.GetGraphicsSampler(handle.sampler)};
diff --git a/src/video_core/renderer_vulkan/vk_pipeline_cache.cpp b/src/video_core/renderer_vulkan/vk_pipeline_cache.cpp
index e9b93336b..4317b2ac7 100644
--- a/src/video_core/renderer_vulkan/vk_pipeline_cache.cpp
+++ b/src/video_core/renderer_vulkan/vk_pipeline_cache.cpp
@@ -188,9 +188,7 @@ protected:
}
Shader::TextureType ReadTextureTypeImpl(GPUVAddr tic_addr, u32 tic_limit, bool via_header_index,
- GPUVAddr cbuf_addr, u32 cbuf_size, u32 cbuf_index,
- u32 cbuf_offset) {
- const u32 raw{cbuf_offset < cbuf_size ? gpu_memory->Read<u32>(cbuf_addr + cbuf_offset) : 0};
+ u32 raw) {
const TextureHandle handle{raw, via_header_index};
const GPUVAddr descriptor_addr{tic_addr + handle.image * sizeof(Tegra::Texture::TICEntry)};
Tegra::Texture::TICEntry entry;
@@ -219,7 +217,7 @@ protected:
throw Shader::NotImplementedException("Unknown texture type");
}
}()};
- texture_types.emplace(MakeCbufKey(cbuf_index, cbuf_offset), result);
+ texture_types.emplace(raw, result);
return result;
}
@@ -227,7 +225,7 @@ protected:
GPUVAddr program_base{};
std::vector<u64> code;
- std::unordered_map<u64, Shader::TextureType> texture_types;
+ std::unordered_map<u32, Shader::TextureType> texture_types;
std::unordered_map<u64, u32> cbuf_values;
u32 local_memory_size{};
@@ -250,7 +248,7 @@ using Shader::Maxwell::TranslateProgram;
// TODO: Move this to a separate file
constexpr std::array<char, 8> MAGIC_NUMBER{'y', 'u', 'z', 'u', 'c', 'a', 'c', 'h'};
-constexpr u32 CACHE_VERSION{1};
+constexpr u32 CACHE_VERSION{2};
class GraphicsEnvironment final : public GenericEnvironment {
public:
@@ -308,13 +306,10 @@ public:
return value;
}
- Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
+ Shader::TextureType ReadTextureType(u32 handle) override {
const auto& regs{maxwell3d->regs};
- const auto& cbuf{maxwell3d->state.shader_stages[stage_index].const_buffers[cbuf_index]};
- ASSERT(cbuf.enabled);
const bool via_header_index{regs.sampler_index == Maxwell::SamplerIndex::ViaHeaderIndex};
- return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, via_header_index,
- cbuf.address, cbuf.size, cbuf_index, cbuf_offset);
+ return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, via_header_index, handle);
}
private:
@@ -352,13 +347,10 @@ public:
return value;
}
- Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
+ Shader::TextureType ReadTextureType(u32 handle) override {
const auto& regs{kepler_compute->regs};
const auto& qmd{kepler_compute->launch_description};
- ASSERT(((qmd.const_buffer_enable_mask.Value() >> cbuf_index) & 1) != 0);
- const auto& cbuf{qmd.const_buffer_config[cbuf_index]};
- return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, qmd.linked_tsc != 0,
- cbuf.Address(), cbuf.size, cbuf_index, cbuf_offset);
+ return ReadTextureTypeImpl(regs.tic.Address(), regs.tic.limit, qmd.linked_tsc != 0, handle);
}
private:
@@ -421,7 +413,7 @@ public:
code = std::make_unique<u64[]>(Common::DivCeil(code_size, sizeof(u64)));
file.read(reinterpret_cast<char*>(code.get()), code_size);
for (size_t i = 0; i < num_texture_types; ++i) {
- u64 key;
+ u32 key;
Shader::TextureType type;
file.read(reinterpret_cast<char*>(&key), sizeof(key))
.read(reinterpret_cast<char*>(&type), sizeof(type));
@@ -457,8 +449,8 @@ public:
return it->second;
}
- Shader::TextureType ReadTextureType(u32 cbuf_index, u32 cbuf_offset) override {
- const auto it{texture_types.find(MakeCbufKey(cbuf_index, cbuf_offset))};
+ Shader::TextureType ReadTextureType(u32 handle) override {
+ const auto it{texture_types.find(handle)};
if (it == texture_types.end()) {
throw Shader::LogicError("Uncached read texture type");
}
@@ -483,7 +475,7 @@ public:
private:
std::unique_ptr<u64[]> code;
- std::unordered_map<u64, Shader::TextureType> texture_types;
+ std::unordered_map<u32, Shader::TextureType> texture_types;
std::unordered_map<u64, u32> cbuf_values;
std::array<u32, 3> workgroup_size{};
u32 local_memory_size{};