shader: Implement transform feedbacks and define file format
This commit is contained in:
parent
a83579b50a
commit
b126987c59
11 changed files with 272 additions and 23 deletions
|
@ -52,6 +52,8 @@ void FixedPipelineState::Refresh(Tegra::Engines::Maxwell3D& maxwell3d,
|
|||
const u32 topology_index = static_cast<u32>(regs.draw.topology.Value());
|
||||
|
||||
raw1 = 0;
|
||||
no_extended_dynamic_state.Assign(has_extended_dynamic_state ? 0 : 1);
|
||||
xfb_enabled.Assign(regs.tfb_enabled != 0);
|
||||
primitive_restart_enable.Assign(regs.primitive_restart.enabled != 0 ? 1 : 0);
|
||||
depth_bias_enable.Assign(enabled_lut[POLYGON_OFFSET_ENABLE_LUT[topology_index]] != 0 ? 1 : 0);
|
||||
depth_clamp_disabled.Assign(regs.view_volume_clip_control.depth_clamp_disabled.Value());
|
||||
|
@ -113,10 +115,12 @@ void FixedPipelineState::Refresh(Tegra::Engines::Maxwell3D& maxwell3d,
|
|||
return static_cast<u16>(viewport.swizzle.raw);
|
||||
});
|
||||
}
|
||||
if (!has_extended_dynamic_state) {
|
||||
no_extended_dynamic_state.Assign(1);
|
||||
if (no_extended_dynamic_state != 0) {
|
||||
dynamic_state.Refresh(regs);
|
||||
}
|
||||
if (xfb_enabled != 0) {
|
||||
xfb_state.Refresh(regs);
|
||||
}
|
||||
}
|
||||
|
||||
void FixedPipelineState::BlendingAttachment::Refresh(const Maxwell& regs, size_t index) {
|
||||
|
@ -158,6 +162,17 @@ void FixedPipelineState::BlendingAttachment::Refresh(const Maxwell& regs, size_t
|
|||
enable.Assign(1);
|
||||
}
|
||||
|
||||
void FixedPipelineState::TransformFeedbackState::Refresh(const Maxwell& regs) {
|
||||
std::ranges::transform(regs.tfb_layouts, layouts.begin(), [](const auto& layout) {
|
||||
return Layout{
|
||||
.stream = layout.stream,
|
||||
.varying_count = layout.varying_count,
|
||||
.stride = layout.stride,
|
||||
};
|
||||
});
|
||||
varyings = regs.tfb_varying_locs;
|
||||
}
|
||||
|
||||
void FixedPipelineState::DynamicState::Refresh(const Maxwell& regs) {
|
||||
u32 packed_front_face = PackFrontFace(regs.front_face);
|
||||
if (regs.screen_y_control.triangle_rast_flip != 0) {
|
||||
|
|
|
@ -130,6 +130,18 @@ struct FixedPipelineState {
|
|||
}
|
||||
};
|
||||
|
||||
// Transform feedback configuration stored as part of the fixed pipeline state.
// Filled by Refresh() from regs.tfb_layouts and regs.tfb_varying_locs.
struct TransformFeedbackState {
|
||||
// Per-buffer layout description, copied field by field from the matching register layout.
struct Layout {
|
||||
// Copied into the `buffer` field of each varying generated for this layout
u32 stream;
|
||||
// Number of entries of the matching `varyings` row that are in use
u32 varying_count;
|
||||
// Copied into the `stride` field of each varying; presumably in bytes — TODO confirm
u32 stride;
|
||||
};
|
||||
// One layout per transform feedback buffer
std::array<Layout, Maxwell::NumTransformFeedbackBuffers> layouts;
|
||||
// Per-buffer table of attribute locations; only the first `varying_count` entries of a row
// are read when the varyings are built
std::array<std::array<u8, 128>, Maxwell::NumTransformFeedbackBuffers> varyings;
|
||||
|
||||
// Reloads `layouts` and `varyings` from the given register state
void Refresh(const Maxwell& regs);
|
||||
};
|
||||
|
||||
struct DynamicState {
|
||||
union {
|
||||
u32 raw1;
|
||||
|
@ -168,6 +180,7 @@ struct FixedPipelineState {
|
|||
union {
|
||||
u32 raw1;
|
||||
BitField<0, 1, u32> no_extended_dynamic_state;
|
||||
BitField<1, 1, u32> xfb_enabled;
|
||||
BitField<2, 1, u32> primitive_restart_enable;
|
||||
BitField<3, 1, u32> depth_bias_enable;
|
||||
BitField<4, 1, u32> depth_clamp_disabled;
|
||||
|
@ -199,6 +212,7 @@ struct FixedPipelineState {
|
|||
std::array<BlendingAttachment, Maxwell::NumRenderTargets> attachments;
|
||||
std::array<u16, Maxwell::NumViewports> viewport_swizzles;
|
||||
DynamicState dynamic_state;
|
||||
TransformFeedbackState xfb_state;
|
||||
|
||||
void Refresh(Tegra::Engines::Maxwell3D& maxwell3d, bool has_extended_dynamic_state);
|
||||
|
||||
|
@ -211,8 +225,16 @@ struct FixedPipelineState {
|
|||
}
|
||||
|
||||
size_t Size() const noexcept {
|
||||
const size_t total_size = sizeof *this;
|
||||
return total_size - (no_extended_dynamic_state != 0 ? 0 : sizeof(DynamicState));
|
||||
if (xfb_enabled != 0) {
|
||||
// When transform feedback is enabled, use the whole struct
|
||||
return sizeof(*this);
|
||||
} else if (no_extended_dynamic_state != 0) {
|
||||
// Dynamic state is enabled, we can enable more
|
||||
return offsetof(FixedPipelineState, xfb_state);
|
||||
} else {
|
||||
// No XFB, extended dynamic state enabled
|
||||
return offsetof(FixedPipelineState, dynamic_state);
|
||||
}
|
||||
}
|
||||
};
|
||||
static_assert(std::has_unique_object_representations_v<FixedPipelineState>);
|
||||
|
|
|
@ -248,6 +248,10 @@ namespace {
|
|||
using Shader::Backend::SPIRV::EmitSPIRV;
|
||||
using Shader::Maxwell::TranslateProgram;
|
||||
|
||||
// TODO: Move this to a separate file
|
||||
// Signature bytes written at the very start of a new pipeline cache file (see the header write
// in SerializePipeline). LoadDiskResources compares the first 8 bytes of the file against this
// value and deletes the file when they differ.
constexpr std::array<char, 8> MAGIC_NUMBER{'y', 'u', 'z', 'u', 'c', 'a', 'c', 'h'};
|
||||
// Cache format version, written as a raw u32 right after the magic number. A file whose stored
// version differs from this value is deleted on load instead of being parsed.
constexpr u32 CACHE_VERSION{1};
|
||||
|
||||
class GraphicsEnvironment final : public GenericEnvironment {
|
||||
public:
|
||||
explicit GraphicsEnvironment() = default;
|
||||
|
@ -379,13 +383,14 @@ void SerializePipeline(const Key& key, const Envs& envs, const std::string& file
|
|||
try {
|
||||
std::ofstream file;
|
||||
file.exceptions(std::ifstream::failbit);
|
||||
Common::FS::OpenFStream(file, filename, std::ios::binary | std::ios::app);
|
||||
Common::FS::OpenFStream(file, filename, std::ios::binary | std::ios::ate | std::ios::app);
|
||||
if (!file.is_open()) {
|
||||
LOG_ERROR(Common_Filesystem, "Failed to open pipeline cache file {}", filename);
|
||||
return;
|
||||
}
|
||||
if (file.tellp() == 0) {
|
||||
// Write header...
|
||||
file.write(MAGIC_NUMBER.data(), MAGIC_NUMBER.size())
|
||||
.write(reinterpret_cast<const char*>(&CACHE_VERSION), sizeof(CACHE_VERSION));
|
||||
}
|
||||
const std::span key_span(reinterpret_cast<const char*>(&key), sizeof(key));
|
||||
SerializePipeline(key_span, MakeSpan(envs), file);
|
||||
|
@ -520,8 +525,27 @@ void PipelineCache::LoadDiskResources(u64 title_id, std::stop_token stop_loading
|
|||
file.exceptions(std::ifstream::failbit);
|
||||
const auto end{file.tellg()};
|
||||
file.seekg(0, std::ios::beg);
|
||||
// Read header...
|
||||
|
||||
std::array<char, 8> magic_number;
|
||||
u32 cache_version;
|
||||
file.read(magic_number.data(), magic_number.size())
|
||||
.read(reinterpret_cast<char*>(&cache_version), sizeof(cache_version));
|
||||
if (magic_number != MAGIC_NUMBER || cache_version != CACHE_VERSION) {
|
||||
file.close();
|
||||
if (Common::FS::Delete(pipeline_cache_filename)) {
|
||||
if (magic_number != MAGIC_NUMBER) {
|
||||
LOG_ERROR(Render_Vulkan, "Invalid pipeline cache file");
|
||||
}
|
||||
if (cache_version != CACHE_VERSION) {
|
||||
LOG_INFO(Render_Vulkan, "Deleting old pipeline cache");
|
||||
}
|
||||
} else {
|
||||
LOG_ERROR(Render_Vulkan,
|
||||
"Invalid pipeline cache file and failed to delete it in \"{}\"",
|
||||
pipeline_cache_filename);
|
||||
}
|
||||
return;
|
||||
}
|
||||
while (file.tellg() != end) {
|
||||
if (stop_loading) {
|
||||
return;
|
||||
|
@ -879,6 +903,88 @@ static Shader::AttributeType CastAttributeType(const FixedPipelineState::VertexA
|
|||
return Shader::AttributeType::Float;
|
||||
}
|
||||
|
||||
static std::vector<Shader::TransformFeedbackVarying> MakeTransformFeedbackVaryings(
|
||||
const GraphicsPipelineCacheKey& key) {
|
||||
static constexpr std::array VECTORS{
|
||||
28, // gl_Position
|
||||
32, // Generic 0
|
||||
36, // Generic 1
|
||||
40, // Generic 2
|
||||
44, // Generic 3
|
||||
48, // Generic 4
|
||||
52, // Generic 5
|
||||
56, // Generic 6
|
||||
60, // Generic 7
|
||||
64, // Generic 8
|
||||
68, // Generic 9
|
||||
72, // Generic 10
|
||||
76, // Generic 11
|
||||
80, // Generic 12
|
||||
84, // Generic 13
|
||||
88, // Generic 14
|
||||
92, // Generic 15
|
||||
96, // Generic 16
|
||||
100, // Generic 17
|
||||
104, // Generic 18
|
||||
108, // Generic 19
|
||||
112, // Generic 20
|
||||
116, // Generic 21
|
||||
120, // Generic 22
|
||||
124, // Generic 23
|
||||
128, // Generic 24
|
||||
132, // Generic 25
|
||||
136, // Generic 26
|
||||
140, // Generic 27
|
||||
144, // Generic 28
|
||||
148, // Generic 29
|
||||
152, // Generic 30
|
||||
156, // Generic 31
|
||||
160, // gl_FrontColor
|
||||
164, // gl_FrontSecondaryColor
|
||||
160, // gl_BackColor
|
||||
164, // gl_BackSecondaryColor
|
||||
192, // gl_TexCoord[0]
|
||||
196, // gl_TexCoord[1]
|
||||
200, // gl_TexCoord[2]
|
||||
204, // gl_TexCoord[3]
|
||||
208, // gl_TexCoord[4]
|
||||
212, // gl_TexCoord[5]
|
||||
216, // gl_TexCoord[6]
|
||||
220, // gl_TexCoord[7]
|
||||
};
|
||||
std::vector<Shader::TransformFeedbackVarying> xfb(256);
|
||||
for (size_t buffer = 0; buffer < Maxwell::NumTransformFeedbackBuffers; ++buffer) {
|
||||
const auto& locations = key.state.xfb_state.varyings[buffer];
|
||||
const auto& layout = key.state.xfb_state.layouts[buffer];
|
||||
const u32 varying_count = layout.varying_count;
|
||||
u32 highest = 0;
|
||||
for (u32 offset = 0; offset < varying_count; ++offset) {
|
||||
const u32 base_offset = offset;
|
||||
const u8 location = locations[offset];
|
||||
|
||||
Shader::TransformFeedbackVarying varying;
|
||||
varying.buffer = layout.stream;
|
||||
varying.stride = layout.stride;
|
||||
varying.offset = offset * 4;
|
||||
varying.components = 1;
|
||||
|
||||
if (std::ranges::find(VECTORS, Common::AlignDown(location, 4)) != VECTORS.end()) {
|
||||
UNIMPLEMENTED_IF_MSG(location % 4 != 0, "Unaligned TFB");
|
||||
|
||||
const u8 base_index = location / 4;
|
||||
while (offset + 1 < varying_count && base_index == locations[offset + 1] / 4) {
|
||||
++offset;
|
||||
++varying.components;
|
||||
}
|
||||
}
|
||||
xfb[location] = varying;
|
||||
highest = std::max(highest, (base_offset + varying.components) * 4);
|
||||
}
|
||||
UNIMPLEMENTED_IF(highest != layout.stride);
|
||||
}
|
||||
return xfb;
|
||||
}
|
||||
|
||||
Shader::Profile PipelineCache::MakeProfile(const GraphicsPipelineCacheKey& key,
|
||||
const Shader::IR::Program& program) {
|
||||
Shader::Profile profile{base_profile};
|
||||
|
@ -893,6 +999,9 @@ Shader::Profile PipelineCache::MakeProfile(const GraphicsPipelineCacheKey& key,
|
|||
if (key.state.topology == Maxwell::PrimitiveTopology::Points) {
|
||||
profile.fixed_state_point_size = point_size;
|
||||
}
|
||||
if (key.state.xfb_enabled != 0) {
|
||||
profile.xfb_varyings = MakeTransformFeedbackVaryings(key);
|
||||
}
|
||||
profile.convert_depth_mode = gl_ndc;
|
||||
}
|
||||
std::ranges::transform(key.state.attributes, profile.generic_input_types.begin(),
|
||||
|
@ -902,6 +1011,9 @@ Shader::Profile PipelineCache::MakeProfile(const GraphicsPipelineCacheKey& key,
|
|||
if (program.output_topology == Shader::OutputTopology::PointList) {
|
||||
profile.fixed_state_point_size = point_size;
|
||||
}
|
||||
if (key.state.xfb_enabled != 0) {
|
||||
profile.xfb_varyings = MakeTransformFeedbackVaryings(key);
|
||||
}
|
||||
profile.convert_depth_mode = gl_ndc;
|
||||
break;
|
||||
default:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue