cnq3/code/renderer/shaders/grp/uber_shader.hlsl

293 lines
7.4 KiB
HLSL

/*
===========================================================================
Copyright (C) 2023 Gian 'myT' Schellenbaum
This file is part of Challenge Quake 3 (CNQ3).
Challenge Quake 3 is free software; you can redistribute it
and/or modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of the License,
or (at your option) any later version.
Challenge Quake 3 is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with Challenge Quake 3. If not, see <https://www.gnu.org/licenses/>.
===========================================================================
*/
// the uber shader is the all-encompassing world and game UI rendering shader
//
// VS macros to define:
// STAGE_COUNT 1-8
//
// PS macros to define:
// DITHER
// STAGE_COUNT 1-8
// STAGE#_BITS
//
#define STAGE_ATTRIBS(Index) \
float2 texCoords##Index : TEXCOORD##Index; \
float4 color##Index : COLOR##Index;
#if VERTEX_SHADER
struct VIn
{
float3 position : POSITION;
float3 normal : NORMAL;
#if STAGE_COUNT >= 1
STAGE_ATTRIBS(0)
#endif
#if STAGE_COUNT >= 2
STAGE_ATTRIBS(1)
#endif
#if STAGE_COUNT >= 3
STAGE_ATTRIBS(2)
#endif
#if STAGE_COUNT >= 4
STAGE_ATTRIBS(3)
#endif
#if STAGE_COUNT >= 5
STAGE_ATTRIBS(4)
#endif
#if STAGE_COUNT >= 6
STAGE_ATTRIBS(5)
#endif
#if STAGE_COUNT >= 7
STAGE_ATTRIBS(6)
#endif
#if STAGE_COUNT >= 8
STAGE_ATTRIBS(7)
#endif
};
#endif
struct VOut
{
float4 position : SV_Position;
float3 normal : NORMAL;
#if STAGE_COUNT >= 1
STAGE_ATTRIBS(0)
#endif
#if STAGE_COUNT >= 2
STAGE_ATTRIBS(1)
#endif
#if STAGE_COUNT >= 3
STAGE_ATTRIBS(2)
#endif
#if STAGE_COUNT >= 4
STAGE_ATTRIBS(3)
#endif
#if STAGE_COUNT >= 5
STAGE_ATTRIBS(4)
#endif
#if STAGE_COUNT >= 6
STAGE_ATTRIBS(5)
#endif
#if STAGE_COUNT >= 7
STAGE_ATTRIBS(6)
#endif
#if STAGE_COUNT >= 8
STAGE_ATTRIBS(7)
#endif
float clipDist : SV_ClipDistance0;
float2 proj2232 : PROJ;
float depthVS : DEPTHVS;
};
#undef STAGE_ATTRIBS
#if VERTEX_SHADER
cbuffer RootConstants
{
matrix modelViewMatrix;
matrix projectionMatrix;
float4 clipPlane;
};
#define STAGE_ATTRIBS(Index) \
output.texCoords##Index = input.texCoords##Index; \
output.color##Index = input.color##Index;
VOut vs(VIn input)
{
float4 positionVS = mul(modelViewMatrix, float4(input.position.xyz, 1));
VOut output;
output.position = mul(projectionMatrix, positionVS);
output.normal = input.normal;
#if STAGE_COUNT >= 1
STAGE_ATTRIBS(0)
#endif
#if STAGE_COUNT >= 2
STAGE_ATTRIBS(1)
#endif
#if STAGE_COUNT >= 3
STAGE_ATTRIBS(2)
#endif
#if STAGE_COUNT >= 4
STAGE_ATTRIBS(3)
#endif
#if STAGE_COUNT >= 5
STAGE_ATTRIBS(4)
#endif
#if STAGE_COUNT >= 6
STAGE_ATTRIBS(5)
#endif
#if STAGE_COUNT >= 7
STAGE_ATTRIBS(6)
#endif
#if STAGE_COUNT >= 8
STAGE_ATTRIBS(7)
#endif
output.clipDist = dot(positionVS, clipPlane);
output.proj2232 = float2(-projectionMatrix[2][2], projectionMatrix[2][3]);
output.depthVS = -positionVS.z;
return output;
}
#endif
#if PIXEL_SHADER
#if USE_INCLUDES
#include "shared.hlsli"
#include "../common/state_bits.h.hlsli"
#include "../common/blend.hlsli"
#endif
cbuffer RootConstants
{
// general
uint4 stageIndices0; // sampler: 16 - texture: 16
uint4 stageIndices1;
float greyscale;
// shader trace
uint shaderTrace; // shader index: 14 - frame index: 2 - enable: 1
uint centerPixel; // y: 16 - x: 16
// depth fade
uint halfDistOffset; // low: distance - high: offset
uint depthFadeColorTex; // texture index: 12 - color bias: 4 - color scale: 4
// dither
uint halfSeedNoise; // low: frame seed - high: noise scale
uint halfInvGammaBright; // low: inv gamma - high: inv brightness
};
Texture2D textures2D[4096] : register(t0);
SamplerState samplers[96] : register(s0);
RWByteAddressBuffer shaderIndexBuffer : register(u0);
bool FailsAlphaTest(float alpha, uint stateBits)
{
if(stateBits == GLS_ATEST_GT_0)
return alpha == 0.0;
else if(stateBits == GLS_ATEST_LT_80)
return alpha >= 0.5;
else if(stateBits == GLS_ATEST_GE_80)
return alpha < 0.5;
else
return false;
}
float4 ProcessStage(float4 color, float2 texCoords, uint textureIndex, uint samplerIndex)
{
return color * textures2D[textureIndex].Sample(samplers[samplerIndex], texCoords);
}
void ProcessFullStage(inout float4 dst, float4 color, float2 texCoords, uint textureIndex, uint samplerIndex, uint stateBits)
{
float4 src = ProcessStage(color, texCoords, textureIndex, samplerIndex);
if(!FailsAlphaTest(src.a, stateBits & GLS_ATEST_BITS))
{
dst = Blend(src, dst, stateBits);
}
}
// reminder: early-Z is early depth test AND early depth write
// therefore, the attribute should be gone if opaque stage #1 does alpha testing (discard)
#if (STAGE0_BITS & GLS_ATEST_BITS) == 0
[earlydepthstencil]
#endif
float4 ps(VOut input) : SV_Target
{
float4 dst = ProcessStage(input.color0, input.texCoords0, stageIndices0.x & 0xFFFF, stageIndices0.x >> 16);
if(FailsAlphaTest(dst.a, STAGE0_BITS & GLS_ATEST_BITS))
{
discard;
}
#if STAGE_COUNT >= 2
ProcessFullStage(dst, input.color1, input.texCoords1, stageIndices0.y & 0xFFFF, stageIndices0.y >> 16, STAGE1_BITS);
#endif
#if STAGE_COUNT >= 3
ProcessFullStage(dst, input.color2, input.texCoords2, stageIndices0.z & 0xFFFF, stageIndices0.z >> 16, STAGE2_BITS);
#endif
#if STAGE_COUNT >= 4
ProcessFullStage(dst, input.color3, input.texCoords3, stageIndices0.w & 0xFFFF, stageIndices0.w >> 16, STAGE3_BITS);
#endif
#if STAGE_COUNT >= 5
ProcessFullStage(dst, input.color4, input.texCoords4, stageIndices1.x & 0xFFFF, stageIndices1.x >> 16, STAGE4_BITS);
#endif
#if STAGE_COUNT >= 6
ProcessFullStage(dst, input.color5, input.texCoords5, stageIndices1.y & 0xFFFF, stageIndices1.y >> 16, STAGE5_BITS);
#endif
#if STAGE_COUNT >= 7
ProcessFullStage(dst, input.color6, input.texCoords6, stageIndices1.z & 0xFFFF, stageIndices1.z >> 16, STAGE6_BITS);
#endif
#if STAGE_COUNT >= 8
ProcessFullStage(dst, input.color7, input.texCoords7, stageIndices1.w & 0xFFFF, stageIndices1.w >> 16, STAGE7_BITS);
#endif
dst = MakeGreyscale(dst, greyscale);
#if DITHER
float2 seedNoise = UnpackHalf2(halfSeedNoise);
float2 invGammaBright = UnpackHalf2(halfInvGammaBright);
dst = Dither(dst, input.position.xyz, seedNoise.x, seedNoise.y, invGammaBright.y, invGammaBright.x);
#endif
#if DEPTH_FADE
#define BIT(Index) GetBitAsFloat(depthFadeColorTex, Index)
float2 distOffset = UnpackHalf2(halfDistOffset);
float4 fadeColorScale = float4(BIT(0), BIT(1), BIT(2), BIT(3));
float4 fadeColorBias = float4(BIT(4), BIT(5), BIT(6), BIT(7));
float zwDepth = textures2D[depthFadeColorTex >> 8].Load(int3(input.position.xy, 0)).x;// stored depth, z/w
float depthS = LinearDepth(zwDepth, input.proj2232.x, input.proj2232.y); // stored depth, linear
float depthP = input.depthVS - distOffset.y; // fragment depth
float fadeScale = Contrast((depthS - depthP) * distOffset.x, 2.0);
dst = lerp(dst * fadeColorScale + fadeColorBias, dst, fadeScale);
#undef BIT
#endif
if(shaderTrace & 1)
{
// we only store the shader index of 1 pixel
uint2 fragmentCoords = uint2(input.position.xy);
uint2 centerCoords = uint2(centerPixel & 0xFFFF, centerPixel >> 16);
if(all(fragmentCoords == centerCoords))
{
uint frameIndex = (shaderTrace >> 1) & 3;
uint shaderIndex = shaderTrace >> 3;
shaderIndexBuffer.Store(frameIndex * 4, shaderIndex);
}
}
return dst;
}
#endif