Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

HDR Enhancements for Devil May Cry 5 #97

Merged
merged 1 commit into from
Dec 25, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
110 changes: 110 additions & 0 deletions src/games/dmc5/ConvertRec2020PS_0x6AB2B106.ps_5_0.hlsl
Original file line number Diff line number Diff line change
@@ -0,0 +1,110 @@
#include "./DICE.hlsl"
#include "./shared.h"

cbuffer HDRMapping : register(b0) {
float whitePaperNits : packoffset(c0);
float configImageAlphaScale : packoffset(c0.y);
float displayMaxNits : packoffset(c0.z);
float displayMinNits : packoffset(c0.w);
float4 displayMaxNitsRect : packoffset(c1);
float4 standardMaxNitsRect : packoffset(c2);
float4 mdrOutRangeRect : packoffset(c3);
uint drawMode : packoffset(c4);
float gammaForHDR : packoffset(c4.y);
float2 configDrawRectSize : packoffset(c4.z);
}

SamplerState PointBorder_s : register(s0);
Texture2D<float4> tLinearImage : register(t0);

// 3Dmigoto declarations
#define cmp -

float4 main(float4 v0: SV_Position0, float2 v1: TEXCOORD0)
: SV_Target {
#if 1
float3 bt709Color =
tLinearImage.SampleLevel(PointBorder_s, v1.xy, 0.0f).rgb;
#if 1
bt709Color = renodx::color::correct::GammaSafe(bt709Color);
#endif

#if 2
DICESettings config = DefaultDICESettings();
config.Type = 3;
config.ShoulderStart = 0.5f;
config.DesaturationAmount = 0.f;
config.DarkeningAmount = 0.f;
const float dicePaperWhite =
whitePaperNits / renodx::color::srgb::REFERENCE_WHITE;
const float dicePeakWhite = max(displayMaxNits, whitePaperNits) / renodx::color::srgb::REFERENCE_WHITE;
bt709Color.rgb =
DICETonemap(bt709Color.rgb * dicePaperWhite, dicePeakWhite, config) / dicePaperWhite;
#endif

float3 bt2020Color = renodx::color::bt2020::from::BT709(bt709Color.rgb);

float3 pqColor = renodx::color::pq::Encode(bt2020Color, whitePaperNits);

return float4(pqColor, 1.0);

#else

float4 r0, r1, r2, r3, r4, o0;

r0.xyz = tLinearImage.SampleLevel(PointBorder_s, v1.xy, 0).xyz;
r0.w = dot(float3(0.627403975, 0.329281986, 0.0433136001), r0.xyz);
r1.x = dot(float3(0.0690969974, 0.919539988, 0.0113612004), r0.xyz);
r0.x = dot(float3(0.0163915996, 0.088013202, 0.895595014), r0.xyz);
r2.x = log2(r0.w);
r2.y = log2(r1.x);
r2.z = log2(r0.x);
r0.xyz = gammaForHDR * r2.xyz;
r0.xyz = exp2(r0.xyz);
r0.w = 2.0999999 * whitePaperNits;
r0.w = 10000 / r0.w;
r0.xyz = saturate(r0.xyz / r0.www);
r0.xyz = log2(r0.xyz);
r0.xyz = float3(0.171569824, 0.171569824, 0.171569824) * r0.xyz;
r0.xyz = exp2(r0.xyz);
r1.xyz = r0.xyz * float3(16.71875, 16.71875, 16.71875) + float3(0.84375, 0.84375, 0.84375);
r0.xyz = r0.xyz * float3(16.5625, 16.5625, 16.5625) + float3(1, 1, 1);
r0.xyz = r1.xyz / r0.xyz;
r0.xyz = log2(r0.xyz);
r0.xyz = float3(82.53125, 82.53125, 82.53125) * r0.xyz;
r0.xyz = exp2(r0.xyz);
r0.xyz = min(float3(1, 1, 1), r0.xyz);
r0.w = drawMode & 2;
if (r0.w != 0) {
r1.xyzw = saturate(float4(9.99999975e-005, 9.99999975e-005, 9.99999975e-005,
9.99999975e-005)
* displayMaxNits);
r1.xyzw = log2(r1.xyzw);
r1.xyzw =
float4(0.159301758, 0.159301758, 0.159301758, 0.159301758) * r1.xyzw;
r1.xyzw = exp2(r1.xyzw);
r1.xyzw = r1.xyzw * float4(18.8515625, 18.6875, 18.8515625, 18.6875) + float4(0.8359375, 1, 0.8359375, 1);
r1.xy = r1.xz / r1.yw;
r1.xy = log2(r1.xy);
r1.xy = float2(78.84375, 78.84375) * r1.xy;
r1.xy = exp2(r1.xy);
r1.xy = min(float2(1, 1), r1.xy);
r1.y = r1.x + -r1.y;
r2.xyz = r0.xyz / r1.xxx;
r2.xyz = min(float3(1, 1, 1), r2.xyz);
r3.xyz = r2.xyz * r1.yyy;
r4.xyz = float3(1, 1, 1) + -r2.xyz;
r1.xzw = r2.xyz * r1.xxx;
r1.xyz = r1.yyy * r4.xyz + r1.xzw;
r1.xyz = r1.xyz * r2.xyz;
r1.xyz = r3.xyz * r4.xyz + r1.xyz;
r1.xyz = min(r1.xyz, r0.xyz);
}
if (r0.w == 0) {
r1.xyz = r0.xyz;
}
o0.xyz = r1.xyz;
o0.w = 1;
return o0;
#endif
}
251 changes: 251 additions & 0 deletions src/games/dmc5/DICE.hlsl
Original file line number Diff line number Diff line change
@@ -0,0 +1,251 @@
#include "./shared.h"

static const float HDR10_MaxWhiteNits = 10000.0f;

float max3(float a, float b, float c) {
return max(a, max(b, c));
}

float max3(float3 v) {
return max3(v.x, v.y, v.z);
}

static const float PQ_constant_M1 = 0.1593017578125f;
static const float PQ_constant_M2 = 78.84375f;
static const float PQ_constant_C1 = 0.8359375f;
static const float PQ_constant_C2 = 18.8515625f;
static const float PQ_constant_C3 = 18.6875f;

// PQ (Perceptual Quantizer - ST.2084) encode/decode used for HDR10 BT.2100.
// Clamp type:
// 0 None
// 1 Remove negative numbers
// 2 Remove numbers beyond 0-1
// 3 Mirror negative numbers
float3 Linear_to_PQ(float3 LinearColor, int clampType = 0) {
float3 LinearColorSign = sign(LinearColor);
if (clampType == 1) {
LinearColor = max(LinearColor, 0.f);
} else if (clampType == 2) {
LinearColor = saturate(LinearColor);
} else if (clampType == 3) {
LinearColor = abs(LinearColor);
}
float3 colorPow = pow(LinearColor, PQ_constant_M1);
float3 numerator = PQ_constant_C1 + PQ_constant_C2 * colorPow;
float3 denominator = 1.f + PQ_constant_C3 * colorPow;
float3 pq = pow(numerator / denominator, PQ_constant_M2);
if (clampType == 3) {
return pq * LinearColorSign;
}
return pq;
}

float3 PQ_to_Linear(float3 ST2084Color, int clampType = 0) {
float3 ST2084ColorSign = sign(ST2084Color);
if (clampType == 1) {
ST2084Color = max(ST2084Color, 0.f);
} else if (clampType == 2) {
ST2084Color = saturate(ST2084Color);
} else if (clampType == 3) {
ST2084Color = abs(ST2084Color);
}
float3 colorPow = pow(ST2084Color, 1.f / PQ_constant_M2);
float3 numerator = max(colorPow - PQ_constant_C1, 0.f);
float3 denominator = PQ_constant_C2 - (PQ_constant_C3 * colorPow);
float3 linearColor = pow(numerator / denominator, 1.f / PQ_constant_M1);
if (clampType == 3) {
return linearColor * ST2084ColorSign;
}
return linearColor;
}

// Applies exponential ("Photographic") luminance/luma compression.
// The pow can modulate the curve without changing the values around the edges.
// The max is the max possible range to compress from, to not lose any output
// range if the input range was limited.
float rangeCompress(float X, float Max = asfloat(0x7F7FFFFF)) {
// Branches are for static parameters optimizations
if (Max == asfloat(0x7F7FFFFF)) {
// This does e^X. We expect X to be between 0 and 1.
return 1.f - exp(-X);
}
const float lostRange = exp(-Max);
const float restoreRangeScale = 1.f / (1.f - lostRange);
return (1.f - exp(-X)) * restoreRangeScale;
}

// Refurbished DICE HDR tonemapper (per channel or luminance).
// Expects "InValue" to be >= "ShoulderStart" and "OutMaxValue" to be >
// "ShoulderStart".
float luminanceCompress(float InValue, float OutMaxValue,
float ShoulderStart = 0.f,
bool ConsiderMaxValue = false,
float InMaxValue = asfloat(0x7F7FFFFF)) {
const float compressableValue = InValue - ShoulderStart;
const float compressableRange = InMaxValue - ShoulderStart;
const float compressedRange = OutMaxValue - ShoulderStart;
const float possibleOutValue =
ShoulderStart + compressedRange * rangeCompress(compressableValue / compressedRange, ConsiderMaxValue ? (compressableRange / compressedRange) : asfloat(0x7F7FFFFF));
#if 1
return possibleOutValue;
#else // Enable this branch if "InValue" can be smaller than "ShoulderStart"
return (InValue <= ShoulderStart) ? InValue : possibleOutValue;
#endif
}

#define DICE_TYPE_BY_LUMINANCE_RGB 0
// Doing the DICE compression in PQ (either on luminance or each color channel)
// produces a curve that is closer to our "perception" and leaves more detail
// highlights without overly compressing them
#define DICE_TYPE_BY_LUMINANCE_PQ 1
// Modern HDR displays clip individual rgb channels beyond their "white" peak
// brightness, like, if the peak brightness is 700 nits, any r g b color beyond
// a value of 700/80 will be clipped (not acknowledged, it won't make a
// difference). Tonemapping by luminance, is generally more perception accurate
// but can then generate rgb colors "out of range". This setting fixes them up,
// though it's optional as it's working based on assumptions on how current
// displays work, which might not be true anymore in the future. Note that this
// can create some steep (rough, quickly changing) gradients on very bright
// colors.
#define DICE_TYPE_BY_LUMINANCE_PQ_CORRECT_CHANNELS_BEYOND_PEAK_WHITE 2
// This might look more like classic SDR tonemappers and is closer to how modern
// TVs and Monitors play back colors (usually they clip each individual channel
// to the peak brightness value, though in their native panel color space, or
// current SDR/HDR mode color space). Overall, this seems to handle bright
// gradients more smoothly, even if it shifts hues more (and generally
// desaturating).
#define DICE_TYPE_BY_CHANNEL_PQ 3

struct DICESettings {
uint Type;
// Determines where the highlights curve (shoulder) starts.
// Values between 0.25 and 0.5 are good with DICE by PQ (any type).
// With linear/rgb DICE this barely makes a difference, zero is a good default
// but (e.g.) 0.5 would also work. This should always be between 0 and 1.
float ShoulderStart;

// For "Type == DICE_TYPE_BY_LUMINANCE_PQ_CORRECT_CHANNELS_BEYOND_PEAK_WHITE"
// only: The sum of these needs to be <= 1, both within 0 and 1. The closer
// the sum is to 1, the more each color channel will be containted within its
// peak range.
float DesaturationAmount;
float DarkeningAmount;
};

DICESettings DefaultDICESettings() {
DICESettings Settings;
Settings.Type = DICE_TYPE_BY_CHANNEL_PQ;
Settings.ShoulderStart =
(Settings.Type > DICE_TYPE_BY_LUMINANCE_RGB)
? (1.f / 3.f)
: 0.f; // TODOFT3: increase value!!! (did I already?)
Settings.DesaturationAmount = 1.0 / 3.0;
Settings.DarkeningAmount = 1.0 / 3.0;
return Settings;
}

// Tonemapper inspired from DICE. Can work by luminance to maintain hue.
// Takes scRGB colors with a white level (the value of 1 1 1) of 80 nits (sRGB)
// (to not be confused with paper white). Paper white is expected to have
// already been multiplied in.
float3 DICETonemap(float3 Color, float PeakWhite,
const DICESettings Settings /*= DefaultDICESettings()*/) {
const float sourceLuminance = renodx::color::y::from::BT709(Color);

if (Settings.Type != DICE_TYPE_BY_LUMINANCE_RGB) {
static const float HDR10_MaxWhite =
HDR10_MaxWhiteNits / renodx::color::srgb::REFERENCE_WHITE;

// We could first convert the peak white to PQ and then apply the "shoulder
// start" alpha to it (in PQ), but tests showed scaling it in linear
// actually produces a better curve and more consistently follows the peak
// across different values
const float shoulderStartPQ =
Linear_to_PQ((Settings.ShoulderStart * PeakWhite) / HDR10_MaxWhite).x;
if (Settings.Type == DICE_TYPE_BY_LUMINANCE_PQ || Settings.Type == DICE_TYPE_BY_LUMINANCE_PQ_CORRECT_CHANNELS_BEYOND_PEAK_WHITE) {
const float sourceLuminanceNormalized = sourceLuminance / HDR10_MaxWhite;
const float sourceLuminancePQ =
Linear_to_PQ(sourceLuminanceNormalized, 1).x;

if (sourceLuminancePQ > shoulderStartPQ) // Luminance below the shoulder (or below zero) don't
// need to be adjusted
{
const float peakWhitePQ = Linear_to_PQ(PeakWhite / HDR10_MaxWhite).x;

const float compressedLuminancePQ =
luminanceCompress(sourceLuminancePQ, peakWhitePQ, shoulderStartPQ);
const float compressedLuminanceNormalized =
PQ_to_Linear(compressedLuminancePQ).x;
Color *= compressedLuminanceNormalized / sourceLuminanceNormalized;

if (Settings.Type == DICE_TYPE_BY_LUMINANCE_PQ_CORRECT_CHANNELS_BEYOND_PEAK_WHITE) {
float3 Color_BT2020 = renodx::color::bt2020::from::BT709(Color);
if (any(Color_BT2020 > PeakWhite)) // Optional "optimization" branch
{
float colorLuminance = renodx::color::y::from::BT2020(Color_BT2020);
float colorLuminanceInExcess = colorLuminance - PeakWhite;
float maxColorInExcess =
max3(Color_BT2020) - PeakWhite; // This is guaranteed to be >=
// "colorLuminanceInExcess"
float brightnessReduction = saturate(renodx::math::SafeDivision(
PeakWhite, max3(Color_BT2020),
1)); // Fall back to one in case of division by zero
float desaturateAlpha = saturate(renodx::math::SafeDivision(
maxColorInExcess, maxColorInExcess - colorLuminanceInExcess,
0)); // Fall back to zero in case of division by zero
Color_BT2020 = lerp(Color_BT2020, colorLuminance,
desaturateAlpha * Settings.DesaturationAmount);
Color_BT2020 =
lerp(Color_BT2020, Color_BT2020 * brightnessReduction,
Settings.DarkeningAmount); // Also reduce the brightness to
// partially maintain the hue,
// at the cost of brightness
Color = renodx::color::bt709::from::BT2020(Color_BT2020);
}
}
}
} else // DICE_TYPE_BY_CHANNEL_PQ
{
const float peakWhitePQ = Linear_to_PQ(PeakWhite / HDR10_MaxWhite).x;

// Tonemap in BT.2020 to more closely match the primaries of modern
// displays
const float3 sourceColorNormalized =
renodx::color::bt2020::from::BT709(Color) / HDR10_MaxWhite;
const float3 sourceColorPQ = Linear_to_PQ(sourceColorNormalized, 1);

[unroll]
for (uint i = 0; i < 3;
i++) // TODO LUMA: optimize? will the shader compile already convert
// this to float3? Or should we already make a version with no
// branches that works in float3?
{
if (sourceColorPQ[i] > shoulderStartPQ) // Colors below the shoulder (or below zero) don't
// need to be adjusted
{
const float compressedColorPQ =
luminanceCompress(sourceColorPQ[i], peakWhitePQ, shoulderStartPQ);
const float compressedColorNormalized =
PQ_to_Linear(compressedColorPQ).x;
Color[i] = renodx::color::bt709::from::BT2020(
Color[i] * (compressedColorNormalized / sourceColorNormalized[i]))
.x;
}
}
}
} else // DICE_TYPE_BY_LUMINANCE_RGB
{
const float shoulderStart =
PeakWhite * Settings.ShoulderStart; // From alpha to linear range
if (sourceLuminance > shoulderStart) // Luminances below the shoulder (or below zero) don't
// need to be adjusted
{
const float compressedLuminance =
luminanceCompress(sourceLuminance, PeakWhite, shoulderStart);
Color *= compressedLuminance / sourceLuminance;
}
}

return Color;
}
Loading