csgo-2018-source/materialsystem/stdshaders/csm_common_gameconsole_fxc.h

302 lines
13 KiB
C
Raw Permalink Normal View History

2021-07-24 21:11:47 -07:00
//========== Copyright (c) Valve Corporation, All rights reserved. ==========//
// X360 and PS3 cascaded shadow mapping
// 7LS TODO - PS3
#if defined(_X360)
float CSMSampleShadowBuffer360Simple( sampler DepthSampler, const float3 vProjCoords )
{
float fLOD;
float2 shadowMapCenter = vProjCoords.xy; // Center of shadow filter
float objDepth = min( vProjCoords.z, 0.99999 ); // Object depth in shadow space
// TODO: why doesn't the reverse depth path work with CSM's here since CPU side is set to flip z
//#if defined( REVERSE_DEPTH_ON_X360 )
// objDepth = 1.0f - objDepth;
//#endif
float4 vSampledDepths, vWeights;
asm
{
tfetch2D vSampledDepths.x___, shadowMapCenter, DepthSampler, OffsetX = -0.5, OffsetY = -0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vSampledDepths._x__, shadowMapCenter, DepthSampler, OffsetX = 0.5, OffsetY = -0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vSampledDepths.__x_, shadowMapCenter, DepthSampler, OffsetX = -0.5, OffsetY = 0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vSampledDepths.___x, shadowMapCenter, DepthSampler, OffsetX = 0.5, OffsetY = 0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
};
asm
{
getWeights2D vWeights, shadowMapCenter.xy, DepthSampler, MagFilter=linear, MinFilter=linear, UseComputedLOD=false, UseRegisterLOD=false
};
vWeights = float4( (1-vWeights.x)*(1-vWeights.y), vWeights.x*(1-vWeights.y), (1-vWeights.x)*vWeights.y, vWeights.x*vWeights.y );
//#if defined( REVERSE_DEPTH_ON_X360 )
// float4 vCompare = (vSampledDepths < objDepth.xxxx);
//#else
float4 vCompare = (vSampledDepths > objDepth.xxxx);
//#endif
return 1.0f - dot( vCompare, vWeights );
}
float CSMSampleShadowBuffer3604x4( sampler DepthSampler, const float3 vProjCoords )
{
float2 vShadowMapCenter = vProjCoords.xy + float2( .5f / 1408.0f, .5f / 1408.0f ); // Center of shadow filter
// This shader assumes REVERSE_DEPTH_ON_X360 is always defined.
// TODO: why doesn't the reverse depth path work on CSM's since CPU code is set to flip z
//float flObjDepth = 1.0f - min( vProjCoords.z, 0.99999f ); // Object depth in shadow space
float flObjDepth = min( vProjCoords.z, 0.99999f ); // Object depth in shadow space
// projective distance from z plane in view coords
float4 vDist4 = float4( flObjDepth, flObjDepth, flObjDepth, flObjDepth );
//fraction component of projected coordinates; here FLASHLIGHT_SHADOW_TEXTURE_RESOLUTION represents the shadowmap size
float2 vTexRes = float2( 1408.0f, 1408.0f );
float2 vFrac = frac( vShadowMapCenter * vTexRes );
float4 vWeights = float4( vFrac.x, vFrac.y, 1.0f - vFrac.x, 1.0f - vFrac.y );
float flPercentInLight;
[isolate]
{
float4 vShadowMapVals, vInLight;
asm
{
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
sgt vInLight, vShadowMapVals, vDist4
};
//7LS flipped z sub for above sgt args
//sgt vInLight, vDist4, vShadowMapVals
float4 vShadowMapWeights = float4( vWeights.w, vWeights.z, 1, vWeights.z * vWeights.w );
flPercentInLight = dot( vInLight, vShadowMapWeights );
}
[isolate]
{
float4 vShadowMapVals, vInLight;
asm
{
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
sgt vInLight, vShadowMapVals, vDist4
};
float4 vShadowMapWeights = float4( vWeights.x * vWeights.w, 1, vWeights.x, vWeights.w );
flPercentInLight += dot( vInLight, vShadowMapWeights );
}
[isolate]
{
float4 vShadowMapVals, vInLight;
asm
{
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
sgt vInLight, vShadowMapVals, vDist4
};
float4 vShadowMapWeights = float4( 1, vWeights.z * vWeights.y, vWeights.y, vWeights.z );
flPercentInLight += dot( vInLight, vShadowMapWeights );
}
[isolate]
{
float4 vShadowMapVals, vInLight;
asm
{
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
sgt vInLight, vShadowMapVals, vDist4
};
float4 vShadowMapWeights = float4( vWeights.x, vWeights.y, vWeights.x * vWeights.y, 1 );
flPercentInLight += dot( vInLight, vShadowMapWeights );
}
//sum of weights is 9 since border taps are bilinearly filtered
return 1.0f - (( 1.0f / 9.0f ) * flPercentInLight);
}
#elif defined(_PS3)
// keep this in sync with c_env_cascade_light.cpp
#define CASCADE_RESOLUTION 768
// 1 2 1
// 2 4 2
// 1 2 1
// Tweaked for good code gen with the SCE Cg compiler.
half CSMSampleShadowBufferPS33x3( sampler DepthSampler, const float3 shadowMapPos )
{
float fTexelEpsilon = 1.0f / CASCADE_RESOLUTION;
float3 shadowMapCenter_objDepth = shadowMapPos.xyz;
float3 shadowMapCenter = shadowMapCenter_objDepth.xyz; // Center of shadow filter
float4 vUV0 = shadowMapCenter.xyzx + float4( fTexelEpsilon, fTexelEpsilon, 0.0f, -fTexelEpsilon );
float4 vUV1 = shadowMapCenter.xyzx + float4( fTexelEpsilon, -fTexelEpsilon, 0.0f, -fTexelEpsilon );
half4 vOneTaps;
vOneTaps.x = h4tex2D( DepthSampler, vUV0.xyz ).x;
vOneTaps.y = h4tex2D( DepthSampler, vUV0.wyz ).y;
vOneTaps.z = h4tex2D( DepthSampler, vUV1.xyz ).z;
vOneTaps.w = h4tex2D( DepthSampler, vUV1.wyz ).w;
half flSum = dot( vOneTaps, half4(1.0f, 1.0f, 1.0f, 1.0f));
float4 vUV2 = shadowMapCenter.xyzx + float4( fTexelEpsilon, 0.0f, 0.0f, -fTexelEpsilon );
float4 vUV3 = shadowMapCenter.xyzy + float4( 0.0f, -fTexelEpsilon, 0.0f, fTexelEpsilon );
half4 vTwoTaps;
vTwoTaps.x = h4tex2D( DepthSampler, vUV2.xyz ).x;
vTwoTaps.y = h4tex2D( DepthSampler, vUV2.wyz ).y;
vTwoTaps.z = h4tex2D( DepthSampler, vUV3.xyz ).z;
vTwoTaps.w = h4tex2D( DepthSampler, vUV3.xwz ).w;
flSum += dot( vTwoTaps, half4(2.0f, 2.0f, 2.0f, 2.0f));
flSum += tex2D( DepthSampler, shadowMapCenter ).x * half(4.0f);
// Sum all 9 Taps
return flSum * (1.0h / 16.0h);
}
#else
#error Unsupported
#endif // #elif defined(_PS3)
float CSMSampleShadowBuffer1Tap( float2 vPositionLs, float flComparisonDepth )
{
#if defined(_X360)
#if (CSM_VIEWMODELQUALITY == 0)
return CSMSampleShadowBuffer360Simple( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
#else
return CSMSampleShadowBuffer3604x4( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
#endif
#elif defined(_PS3)
#if (CSM_VIEWMODELQUALITY == 0)
return tex2Dproj( CSMDepthAtlasSampler, float4( vPositionLs.x, vPositionLs.y, flComparisonDepth.x, 1.0f ) );
#else
return CSMSampleShadowBufferPS33x3( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
#endif
#else
#error Unsupported
#endif
}
float CSMSampleShadowBuffer( float2 vPositionLs, float flComparisonDepth )
{
return CSMSampleShadowBuffer1Tap( vPositionLs, flComparisonDepth );
}
int CSMRangeTestExpanded( float2 vCoords )
{
// Returns true if the coordinates are within [.02,.98] - purposely a little sloppy to prevent the shadow filter kernel from leaking outside the cascade's portion of the atlas.
vCoords = vCoords * ( 1.0f / .96f ) - float2( .02f / .96f, .02f / .96f );
return ( dot( saturate( vCoords.xy ) - vCoords.xy, float2( 1, 1 ) ) == 0.0f );
}
int CSMRangeTestNonExpanded( float2 vCoords )
{
return ( dot( saturate( vCoords.xy ) - vCoords.xy, float2( 1, 1 ) ) == 0.0f );
}
float CSMComputeSplitLerpFactor( float2 vPositionToSampleLs )
{
float2 vSplitLerpFactorTemp = float2( 1.0f, 1.0f ) - saturate( ( abs( vPositionToSampleLs.xy - float2( .5f, .5f ) ) - float2( g_flSunShadowingSplitLerpFactorBase, g_flSunShadowingSplitLerpFactorBase ) ) * float2( g_flSunShadowingSplitLerpFactorInvRange, g_flSunShadowingSplitLerpFactorInvRange ) );
return vSplitLerpFactorTemp.x * vSplitLerpFactorTemp.y;
}
float4 CSMTransformLightToTexture( float4 pos, float4x4 mat )
{
#if defined(_PS3)
return mul( mat, pos );
#else
return mul( pos, mat );
#endif
}
#if ( CASCADE_SIZE == 0 )
float CSMComputeShadowing( float3 vPositionWs )
{
return 1.0f;
}
#elif ( CSM_MODE >= 1 )
#error Invalid CSM_MODE
#else
// CSM shader quality level 0 (the only supported level on gameconsole)
float CSMComputeShadowing( float3 vPositionWs )
{
float flShadowScalar = 1.0f;
float4 vPosition4Ws = float4( vPositionWs.xyz, 1.0f );
float3 vPositionToSampleLs = float3( 0.0f, 0.0f, CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[0] ).z );
#if ( CSM_VIEWMODELQUALITY == 0 )
// only consider cascade 1 and 2 for console perf
#if defined(_PS3)
float4 cascadeAtlasUVOffsets_1 = g_vCascadeAtlasUVOffsets[1];
float4 cascadeAtlasUVOffsets_2 = g_vCascadeAtlasUVOffsets[2];
float4 cascadeAtlasUVOffset = cascadeAtlasUVOffsets_1;
#else
int nCascadeIndex = 1;
#endif
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[1] ).xy;
if ( !CSMRangeTestExpanded( vPositionToSampleLs.xy ) )
{
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[2] ).xy;
#if defined(_PS3)
cascadeAtlasUVOffset = cascadeAtlasUVOffsets_2;
#else
nCascadeIndex = 2;
#endif
}
#if defined(_PS3)
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * cascadeAtlasUVOffset.zw + cascadeAtlasUVOffset.xy;
#else
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * g_vCascadeAtlasUVOffsets[nCascadeIndex].zw + g_vCascadeAtlasUVOffsets[nCascadeIndex].xy;
#endif
float3 vCamDelta = vPositionWs - g_vCamPosition.xyz;
float flZLerpFactor = saturate( dot( vCamDelta, vCamDelta ) * g_flSunShadowingZLerpFactorRange + g_flSunShadowingZLerpFactorBase );
flShadowScalar = CSMSampleShadowBuffer( vPositionToSampleLs.xy, vPositionToSampleLs.z );
flShadowScalar = lerp( flShadowScalar, 1.0f, flZLerpFactor );
#else
// Viewmodel shadowing
// only use cascade 0 for viewmodel rendering
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[0] ).xy;
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * g_vCascadeAtlasUVOffsets[0].zw + g_vCascadeAtlasUVOffsets[0].xy;
flShadowScalar = CSMSampleShadowBuffer( vPositionToSampleLs.xy, vPositionToSampleLs.z );
#endif // CSM_VIEWMODELQUALITY == 0
return flShadowScalar;
}
#endif // #if ( CSM_MODE == 0 )