ir: Perform degamma in shader when sampler sets force_degamma (#3420)

* ir: Perform degamma in shader when sampler sets force_degamma
* specialization: Add srgb if image is sampled. Might fix cases where sampler force_degamma is used with an sRGB image.
2025-12-12 14:48:52 +00:00 · 2025-08-19 03:41:41 +03:00
parent 2d53d1a1e2
commit 0b02364f97
12 changed files with 82 additions and 43 deletions
--- a/src/shader_recompiler/ir/ir_emitter.cpp
+++ b/src/shader_recompiler/ir/ir_emitter.cpp
@@ -1169,6 +1169,10 @@ F32 IREmitter::FPLog2(const F32& value) {
    return Inst<F32>(Opcode::FPLog2, value);
 }

+/// Emits a two-operand FPPow instruction and returns its F32 result.
+/// The gamma-to-linear helper uses it with x as the base and y as the exponent.
+F32 IREmitter::FPPow(const F32& x, const F32& y) {
+    const F32 result{Inst<F32>(Opcode::FPPow, x, y)};
+    return result;
+}
+
 F32F64 IREmitter::FPRecip(const F32F64& value) {
    switch (value.Type()) {
    case Type::F32:
--- a/src/shader_recompiler/ir/ir_emitter.h
+++ b/src/shader_recompiler/ir/ir_emitter.h
@@ -228,6 +228,7 @@ public:
    [[nodiscard]] F32 FPSin(const F32& value);
    [[nodiscard]] F32 FPExp2(const F32& value);
    [[nodiscard]] F32 FPLog2(const F32& value);
+    [[nodiscard]] F32 FPPow(const F32& x, const F32& y);
    [[nodiscard]] F32 FPLdexp(const F32& value, const U32& exp);
    [[nodiscard]] F32F64 FPRecip(const F32F64& value);
    [[nodiscard]] F32F64 FPRecipSqrt(const F32F64& value);
--- a/src/shader_recompiler/ir/opcodes.inc
+++ b/src/shader_recompiler/ir/opcodes.inc
@@ -283,6 +283,7 @@ OPCODE(FPRecipSqrt64,                                       F64,            F64,
 OPCODE(FPSqrt,                                              F32,            F32,                                                                            )
 OPCODE(FPSin,                                               F32,            F32,                                                                            )
 OPCODE(FPExp2,                                              F32,            F32,                                                                            )
+OPCODE(FPPow,                                               F32,            F32,            F32,                                                            )
 OPCODE(FPLdexp,                                             F32,            F32,            U32,                                                            )
 OPCODE(FPCos,                                               F32,            F32,                                                                            )
 OPCODE(FPLog2,                                              F32,            F32,                                                                            )
--- a/src/shader_recompiler/ir/passes/resource_tracking_pass.cpp
+++ b/src/shader_recompiler/ir/passes/resource_tracking_pass.cpp
@@ -542,7 +542,7 @@ void PatchImageSharp(IR::Block& block, IR::Inst& inst, Info& info, Descriptors&
    ASSERT(image.GetType() != AmdGpu::ImageType::Invalid);

    // Patch image instruction if image is FMask.
-    if (image.IsFmask()) {
+    if (AmdGpu::IsFmask(image.GetDataFmt())) {
        ASSERT_MSG(!is_written, "FMask storage instructions are not supported");

        IR::IREmitter ir{block, IR::Block::InstructionList::s_iterator_to(inst)};
@@ -830,8 +830,8 @@ IR::Value FixCubeCoords(IR::IREmitter& ir, const AmdGpu::Image& image, const IR:
 void PatchImageSampleArgs(IR::Block& block, IR::Inst& inst, Info& info,
                          const ImageResource& image_res, const AmdGpu::Image& image) {
    const auto handle = inst.Arg(0);
-    const auto sampler_res = info.samplers[(handle.U32() >> 16) & 0xFFFF];
-    auto sampler = sampler_res.GetSharp(info);
+    const auto& sampler_res = info.samplers[(handle.U32() >> 16) & 0xFFFF];
+    const auto sampler = sampler_res.GetSharp(info);

    IR::IREmitter ir{block, IR::Block::InstructionList::s_iterator_to(inst)};
    const auto inst_info = inst.Flags<IR::TextureInstInfo>();
@@ -1001,7 +1001,10 @@ void PatchImageSampleArgs(IR::Block& block, IR::Inst& inst, Info& info,
        return ir.ImageSampleImplicitLod(handle, coords, bias, offset, inst_info);
    }();

-    const auto converted = ApplyReadNumberConversionVec4(ir, texel, image.GetNumberConversion());
+    auto converted = ApplyReadNumberConversionVec4(ir, texel, image.GetNumberConversion());
+    if (sampler.force_degamma && image.GetNumberFmt() != AmdGpu::NumberFormat::Srgb) {
+        converted = ApplyForceDegamma(ir, texel, image.DstSelect());
+    }
    inst.ReplaceUsesWith(converted);
 }

--- a/src/shader_recompiler/ir/reinterpret.h
+++ b/src/shader_recompiler/ir/reinterpret.h
@@ -4,7 +4,7 @@
 #pragma once

 #include "shader_recompiler/ir/ir_emitter.h"
-#include "video_core/amdgpu/types.h"
+#include "video_core/amdgpu/pixel_format.h"

 namespace Shader::IR {

@@ -21,6 +21,36 @@ inline Value ApplySwizzle(IREmitter& ir, const Value& vector, const AmdGpu::Comp
    return swizzled;
 }

+/// Converts a gamma corrected channel value to linear space.
+///
+/// Emits the piecewise conversion
+///   c >  0.04045  ->  ((c + 0.055) / 1.055) ^ 2.4
+///   c <= 0.04045  ->  c / 12.92
+/// Both segments are emitted unconditionally and the result is picked with a select.
+///
+/// @param ir Emitter used to insert the conversion instructions.
+/// @param c  Gamma corrected channel value; it is only read, hence taken by const reference.
+/// @return The value of c converted to linear space.
+inline F32 ApplyGammaToLinear(IREmitter& ir, const F32& c) {
+    // Power-curve segment, selected for inputs above the threshold.
+    const F32 scaled = ir.FPMul(ir.FPAdd(c, ir.Imm32(0.055f)), ir.Imm32(1.0f / 1.055f));
+    const F32 power_segment = ir.FPPow(scaled, ir.Imm32(2.4f));
+    // Linear segment, selected for inputs at or below the threshold.
+    const F32 linear_segment = ir.FPMul(c, ir.Imm32(1.0f / 12.92f));
+    const auto above_threshold = ir.FPGreaterThan(c, ir.Imm32(0.04045f));
+    return F32{ir.Select(above_threshold, power_segment, linear_segment)};
+}
+
+/// Applies gamma-to-linear conversion to a 4-component composite.
+///
+/// A component is converted only when AmdGpu::IsRgb returns true for the matching entry of
+/// the mapping (r, g, b, a correspond to components 0..3); otherwise it passes through as is.
+///
+/// @param ir      Emitter used to insert the extract, conversion and construct instructions.
+/// @param value   Composite whose components 0..3 are read as F32.
+/// @param mapping Component mapping consulted to decide which components are converted.
+/// @return A newly constructed 4-component composite.
+inline Value ApplyForceDegamma(IREmitter& ir, const Value& value,
+                               const AmdGpu::CompMapping& mapping) {
+    // Extract every component first so the extracts precede all conversion instructions.
+    F32 c0{ir.CompositeExtract(value, 0)};
+    F32 c1{ir.CompositeExtract(value, 1)};
+    F32 c2{ir.CompositeExtract(value, 2)};
+    F32 c3{ir.CompositeExtract(value, 3)};
+    // Gamma correction is only applied to RGB components
+    const auto linearize_if_rgb = [&ir](F32& channel, const auto selector) {
+        if (AmdGpu::IsRgb(selector)) {
+            channel = ApplyGammaToLinear(ir, channel);
+        }
+    };
+    linearize_if_rgb(c0, mapping.r);
+    linearize_if_rgb(c1, mapping.g);
+    linearize_if_rgb(c2, mapping.b);
+    linearize_if_rgb(c3, mapping.a);
+    return ir.CompositeConstruct(c0, c1, c2, c3);
+}
+
 /// Applies a number conversion in the read direction.
 inline F32 ApplyReadNumberConversion(IREmitter& ir, const F32& value,
                                     const AmdGpu::NumberConversion& conversion) {