mirror of
https://github.com/Lime3DS/Lime3DS
synced 2025-01-09 13:43:27 +00:00
spv_fs_shader_gen: Implement quaternion correction with barycentric extension (#7152)
This commit is contained in:
parent
312068eebf
commit
168f168c33
3 changed files with 79 additions and 12 deletions
|
@ -472,7 +472,7 @@ void PipelineCache::UseFragmentShader(const Pica::Regs& regs,
|
||||||
if (new_shader) {
|
if (new_shader) {
|
||||||
const bool use_spirv = Settings::values.spirv_shader_gen.GetValue();
|
const bool use_spirv = Settings::values.spirv_shader_gen.GetValue();
|
||||||
if (use_spirv && !fs_config.UsesShadowPipeline()) {
|
if (use_spirv && !fs_config.UsesShadowPipeline()) {
|
||||||
const std::vector code = SPIRV::GenerateFragmentShader(fs_config);
|
const std::vector code = SPIRV::GenerateFragmentShader(fs_config, profile);
|
||||||
shader.module = CompileSPV(code, instance.GetDevice());
|
shader.module = CompileSPV(code, instance.GetDevice());
|
||||||
shader.MarkDone();
|
shader.MarkDone();
|
||||||
} else {
|
} else {
|
||||||
|
|
|
@ -2,6 +2,7 @@
|
||||||
// Licensed under GPLv2 or any later version
|
// Licensed under GPLv2 or any later version
|
||||||
// Refer to the license.txt file included.
|
// Refer to the license.txt file included.
|
||||||
|
|
||||||
|
#include <boost/container/small_vector.hpp>
|
||||||
#include "video_core/shader/generator/spv_fs_shader_gen.h"
|
#include "video_core/shader/generator/spv_fs_shader_gen.h"
|
||||||
|
|
||||||
namespace Pica::Shader::Generator::SPIRV {
|
namespace Pica::Shader::Generator::SPIRV {
|
||||||
|
@ -14,8 +15,10 @@ using TevStageConfig = TexturingRegs::TevStageConfig;
|
||||||
|
|
||||||
constexpr u32 SPIRV_VERSION_1_3 = 0x00010300;
|
constexpr u32 SPIRV_VERSION_1_3 = 0x00010300;
|
||||||
|
|
||||||
FragmentModule::FragmentModule(const FSConfig& config_)
|
FragmentModule::FragmentModule(const FSConfig& config_, const Profile& profile_)
|
||||||
: Sirit::Module{SPIRV_VERSION_1_3}, config{config_} {
|
: Sirit::Module{SPIRV_VERSION_1_3}, config{config_}, profile{profile_},
|
||||||
|
use_fragment_shader_barycentric{profile.has_fragment_shader_barycentric &&
|
||||||
|
config.lighting.enable} {
|
||||||
DefineArithmeticTypes();
|
DefineArithmeticTypes();
|
||||||
DefineUniformStructs();
|
DefineUniformStructs();
|
||||||
DefineInterface();
|
DefineInterface();
|
||||||
|
@ -270,9 +273,48 @@ void FragmentModule::WriteLighting() {
|
||||||
return OpFAdd(vec_ids.Get(3), v, val2);
|
return OpFAdd(vec_ids.Get(3), v, val2);
|
||||||
};
|
};
|
||||||
|
|
||||||
|
// Perform quaternion correction in the fragment shader if fragment_shader_barycentric is
|
||||||
|
// supported.
|
||||||
|
Id normquat{};
|
||||||
|
if (use_fragment_shader_barycentric) {
|
||||||
|
const auto are_quaternions_opposite = [&](Id qa, Id qb) {
|
||||||
|
const Id dot_q{OpDot(f32_id, qa, qb)};
|
||||||
|
const Id dot_le_zero{OpFOrdLessThan(bool_id, dot_q, ConstF32(0.f))};
|
||||||
|
return OpCompositeConstruct(bvec_ids.Get(4), dot_le_zero, dot_le_zero, dot_le_zero,
|
||||||
|
dot_le_zero);
|
||||||
|
};
|
||||||
|
|
||||||
|
const Id input_pointer_id{TypePointer(spv::StorageClass::Input, vec_ids.Get(4))};
|
||||||
|
const Id normquat_0{
|
||||||
|
OpLoad(vec_ids.Get(4), OpAccessChain(input_pointer_id, normquat_id, ConstS32(0)))};
|
||||||
|
const Id normquat_1{
|
||||||
|
OpLoad(vec_ids.Get(4), OpAccessChain(input_pointer_id, normquat_id, ConstS32(1)))};
|
||||||
|
const Id normquat_1_correct{OpSelect(vec_ids.Get(4),
|
||||||
|
are_quaternions_opposite(normquat_0, normquat_1),
|
||||||
|
OpFNegate(vec_ids.Get(4), normquat_1), normquat_1)};
|
||||||
|
const Id normquat_2{
|
||||||
|
OpLoad(vec_ids.Get(4), OpAccessChain(input_pointer_id, normquat_id, ConstS32(2)))};
|
||||||
|
const Id normquat_2_correct{OpSelect(vec_ids.Get(4),
|
||||||
|
are_quaternions_opposite(normquat_0, normquat_2),
|
||||||
|
OpFNegate(vec_ids.Get(4), normquat_2), normquat_2)};
|
||||||
|
const Id bary_coord{OpLoad(vec_ids.Get(3), gl_bary_coord_id)};
|
||||||
|
const Id bary_coord_x{OpCompositeExtract(f32_id, bary_coord, 0)};
|
||||||
|
const Id bary_coord_y{OpCompositeExtract(f32_id, bary_coord, 1)};
|
||||||
|
const Id bary_coord_z{OpCompositeExtract(f32_id, bary_coord, 2)};
|
||||||
|
const Id normquat_0_final{OpVectorTimesScalar(vec_ids.Get(4), normquat_0, bary_coord_x)};
|
||||||
|
const Id normquat_1_final{
|
||||||
|
OpVectorTimesScalar(vec_ids.Get(4), normquat_1_correct, bary_coord_y)};
|
||||||
|
const Id normquat_2_final{
|
||||||
|
OpVectorTimesScalar(vec_ids.Get(4), normquat_2_correct, bary_coord_z)};
|
||||||
|
normquat = OpFAdd(vec_ids.Get(4), normquat_0_final,
|
||||||
|
OpFAdd(vec_ids.Get(4), normquat_1_final, normquat_2_final));
|
||||||
|
} else {
|
||||||
|
normquat = OpLoad(vec_ids.Get(4), normquat_id);
|
||||||
|
}
|
||||||
|
|
||||||
// Rotate the surface-local normal by the interpolated normal quaternion to convert it to
|
// Rotate the surface-local normal by the interpolated normal quaternion to convert it to
|
||||||
// eyespace.
|
// eyespace.
|
||||||
const Id normalized_normquat{OpNormalize(vec_ids.Get(4), OpLoad(vec_ids.Get(4), normquat_id))};
|
const Id normalized_normquat{OpNormalize(vec_ids.Get(4), normquat)};
|
||||||
const Id normal{quaternion_rotate(normalized_normquat, surface_normal)};
|
const Id normal{quaternion_rotate(normalized_normquat, surface_normal)};
|
||||||
const Id tangent{quaternion_rotate(normalized_normquat, surface_tangent)};
|
const Id tangent{quaternion_rotate(normalized_normquat, surface_tangent)};
|
||||||
|
|
||||||
|
@ -1452,13 +1494,24 @@ void FragmentModule::DefineEntryPoint() {
|
||||||
AddCapability(spv::Capability::Shader);
|
AddCapability(spv::Capability::Shader);
|
||||||
AddCapability(spv::Capability::SampledBuffer);
|
AddCapability(spv::Capability::SampledBuffer);
|
||||||
AddCapability(spv::Capability::ImageQuery);
|
AddCapability(spv::Capability::ImageQuery);
|
||||||
|
if (use_fragment_shader_barycentric) {
|
||||||
|
AddCapability(spv::Capability::FragmentBarycentricKHR);
|
||||||
|
AddExtension("SPV_KHR_fragment_shader_barycentric");
|
||||||
|
}
|
||||||
SetMemoryModel(spv::AddressingModel::Logical, spv::MemoryModel::GLSL450);
|
SetMemoryModel(spv::AddressingModel::Logical, spv::MemoryModel::GLSL450);
|
||||||
|
|
||||||
const Id main_type{TypeFunction(TypeVoid())};
|
const Id main_type{TypeFunction(TypeVoid())};
|
||||||
const Id main_func{OpFunction(TypeVoid(), spv::FunctionControlMask::MaskNone, main_type)};
|
const Id main_func{OpFunction(TypeVoid(), spv::FunctionControlMask::MaskNone, main_type)};
|
||||||
AddEntryPoint(spv::ExecutionModel::Fragment, main_func, "main", primary_color_id,
|
|
||||||
texcoord_id[0], texcoord_id[1], texcoord_id[2], texcoord0_w_id, normquat_id,
|
boost::container::small_vector<Id, 11> interface_ids{
|
||||||
view_id, color_id, gl_frag_coord_id, gl_frag_depth_id);
|
primary_color_id, texcoord_id[0], texcoord_id[1], texcoord_id[2], texcoord0_w_id,
|
||||||
|
normquat_id, view_id, color_id, gl_frag_coord_id, gl_frag_depth_id,
|
||||||
|
};
|
||||||
|
if (use_fragment_shader_barycentric) {
|
||||||
|
interface_ids.push_back(gl_bary_coord_id);
|
||||||
|
}
|
||||||
|
|
||||||
|
AddEntryPoint(spv::ExecutionModel::Fragment, main_func, "main", interface_ids);
|
||||||
AddExecutionMode(main_func, spv::ExecutionMode::OriginUpperLeft);
|
AddExecutionMode(main_func, spv::ExecutionMode::OriginUpperLeft);
|
||||||
AddExecutionMode(main_func, spv::ExecutionMode::DepthReplacing);
|
AddExecutionMode(main_func, spv::ExecutionMode::DepthReplacing);
|
||||||
}
|
}
|
||||||
|
@ -1510,7 +1563,12 @@ void FragmentModule::DefineInterface() {
|
||||||
texcoord_id[1] = DefineInput(vec_ids.Get(2), 3);
|
texcoord_id[1] = DefineInput(vec_ids.Get(2), 3);
|
||||||
texcoord_id[2] = DefineInput(vec_ids.Get(2), 4);
|
texcoord_id[2] = DefineInput(vec_ids.Get(2), 4);
|
||||||
texcoord0_w_id = DefineInput(f32_id, 5);
|
texcoord0_w_id = DefineInput(f32_id, 5);
|
||||||
|
if (use_fragment_shader_barycentric) {
|
||||||
|
normquat_id = DefineInput(TypeArray(vec_ids.Get(4), ConstU32(3U)), 6);
|
||||||
|
Decorate(normquat_id, spv::Decoration::PerVertexKHR);
|
||||||
|
} else {
|
||||||
normquat_id = DefineInput(vec_ids.Get(4), 6);
|
normquat_id = DefineInput(vec_ids.Get(4), 6);
|
||||||
|
}
|
||||||
view_id = DefineInput(vec_ids.Get(3), 7);
|
view_id = DefineInput(vec_ids.Get(3), 7);
|
||||||
color_id = DefineOutput(vec_ids.Get(4), 0);
|
color_id = DefineOutput(vec_ids.Get(4), 0);
|
||||||
|
|
||||||
|
@ -1537,10 +1595,14 @@ void FragmentModule::DefineInterface() {
|
||||||
gl_frag_depth_id = DefineVar(f32_id, spv::StorageClass::Output);
|
gl_frag_depth_id = DefineVar(f32_id, spv::StorageClass::Output);
|
||||||
Decorate(gl_frag_coord_id, spv::Decoration::BuiltIn, spv::BuiltIn::FragCoord);
|
Decorate(gl_frag_coord_id, spv::Decoration::BuiltIn, spv::BuiltIn::FragCoord);
|
||||||
Decorate(gl_frag_depth_id, spv::Decoration::BuiltIn, spv::BuiltIn::FragDepth);
|
Decorate(gl_frag_depth_id, spv::Decoration::BuiltIn, spv::BuiltIn::FragDepth);
|
||||||
|
if (use_fragment_shader_barycentric) {
|
||||||
|
gl_bary_coord_id = DefineVar(vec_ids.Get(3), spv::StorageClass::Input);
|
||||||
|
Decorate(gl_bary_coord_id, spv::Decoration::BuiltIn, spv::BuiltIn::BaryCoordKHR);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
std::vector<u32> GenerateFragmentShader(const FSConfig& config) {
|
std::vector<u32> GenerateFragmentShader(const FSConfig& config, const Profile& profile) {
|
||||||
FragmentModule module{config};
|
FragmentModule module{config, profile};
|
||||||
module.Generate();
|
module.Generate();
|
||||||
return module.Assemble();
|
return module.Assemble();
|
||||||
}
|
}
|
||||||
|
|
|
@ -30,7 +30,7 @@ class FragmentModule : public Sirit::Module {
|
||||||
static constexpr u32 NUM_NON_PROC_TEX_UNITS = 3;
|
static constexpr u32 NUM_NON_PROC_TEX_UNITS = 3;
|
||||||
|
|
||||||
public:
|
public:
|
||||||
explicit FragmentModule(const FSConfig& config);
|
explicit FragmentModule(const FSConfig& config, const Profile& profile);
|
||||||
~FragmentModule();
|
~FragmentModule();
|
||||||
|
|
||||||
/// Emits SPIR-V bytecode corresponding to the provided pica fragment configuration
|
/// Emits SPIR-V bytecode corresponding to the provided pica fragment configuration
|
||||||
|
@ -215,6 +215,10 @@ private:
|
||||||
|
|
||||||
private:
|
private:
|
||||||
const FSConfig& config;
|
const FSConfig& config;
|
||||||
|
const Profile& profile;
|
||||||
|
|
||||||
|
bool use_fragment_shader_barycentric{};
|
||||||
|
|
||||||
Id void_id{};
|
Id void_id{};
|
||||||
Id bool_id{};
|
Id bool_id{};
|
||||||
Id f32_id{};
|
Id f32_id{};
|
||||||
|
@ -242,6 +246,7 @@ private:
|
||||||
|
|
||||||
Id gl_frag_coord_id{};
|
Id gl_frag_coord_id{};
|
||||||
Id gl_frag_depth_id{};
|
Id gl_frag_depth_id{};
|
||||||
|
Id gl_bary_coord_id{};
|
||||||
Id depth{};
|
Id depth{};
|
||||||
|
|
||||||
Id tex0_id{};
|
Id tex0_id{};
|
||||||
|
@ -284,6 +289,6 @@ private:
|
||||||
* @param separable_shader generates shader that can be used for separate shader object
|
* @param separable_shader generates shader that can be used for separate shader object
|
||||||
* @returns String of the shader source code
|
* @returns String of the shader source code
|
||||||
*/
|
*/
|
||||||
std::vector<u32> GenerateFragmentShader(const FSConfig& config);
|
std::vector<u32> GenerateFragmentShader(const FSConfig& config, const Profile& profile);
|
||||||
|
|
||||||
} // namespace Pica::Shader::Generator::SPIRV
|
} // namespace Pica::Shader::Generator::SPIRV
|
||||||
|
|
Loading…
Reference in a new issue