302 lines
13 KiB
C
302 lines
13 KiB
C
|
//========== Copyright (c) Valve Corporation, All rights reserved. ==========//
|
||
|
|
||
|
// X360 and PS3 cascaded shadow mapping
|
||
|
|
||
|
// 7LS TODO - PS3
|
||
|
#if defined(_X360)
|
||
|
|
||
|
float CSMSampleShadowBuffer360Simple( sampler DepthSampler, const float3 vProjCoords )
|
||
|
{
|
||
|
float fLOD;
|
||
|
float2 shadowMapCenter = vProjCoords.xy; // Center of shadow filter
|
||
|
float objDepth = min( vProjCoords.z, 0.99999 ); // Object depth in shadow space
|
||
|
|
||
|
// TODO: why doesn't the reverse depth path work with CSM's here since CPU side is set to flip z
|
||
|
|
||
|
//#if defined( REVERSE_DEPTH_ON_X360 )
|
||
|
// objDepth = 1.0f - objDepth;
|
||
|
//#endif
|
||
|
|
||
|
float4 vSampledDepths, vWeights;
|
||
|
|
||
|
asm
|
||
|
{
|
||
|
tfetch2D vSampledDepths.x___, shadowMapCenter, DepthSampler, OffsetX = -0.5, OffsetY = -0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vSampledDepths._x__, shadowMapCenter, DepthSampler, OffsetX = 0.5, OffsetY = -0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vSampledDepths.__x_, shadowMapCenter, DepthSampler, OffsetX = -0.5, OffsetY = 0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vSampledDepths.___x, shadowMapCenter, DepthSampler, OffsetX = 0.5, OffsetY = 0.5, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
};
|
||
|
|
||
|
asm
|
||
|
{
|
||
|
getWeights2D vWeights, shadowMapCenter.xy, DepthSampler, MagFilter=linear, MinFilter=linear, UseComputedLOD=false, UseRegisterLOD=false
|
||
|
};
|
||
|
|
||
|
vWeights = float4( (1-vWeights.x)*(1-vWeights.y), vWeights.x*(1-vWeights.y), (1-vWeights.x)*vWeights.y, vWeights.x*vWeights.y );
|
||
|
|
||
|
//#if defined( REVERSE_DEPTH_ON_X360 )
|
||
|
// float4 vCompare = (vSampledDepths < objDepth.xxxx);
|
||
|
//#else
|
||
|
float4 vCompare = (vSampledDepths > objDepth.xxxx);
|
||
|
//#endif
|
||
|
|
||
|
return 1.0f - dot( vCompare, vWeights );
|
||
|
}
|
||
|
|
||
|
float CSMSampleShadowBuffer3604x4( sampler DepthSampler, const float3 vProjCoords )
|
||
|
{
|
||
|
float2 vShadowMapCenter = vProjCoords.xy + float2( .5f / 1408.0f, .5f / 1408.0f ); // Center of shadow filter
|
||
|
|
||
|
// This shader assumes REVERSE_DEPTH_ON_X360 is always defined.
|
||
|
// TODO: why doesn't the reverse depth path work on CSM's since CPU code is set to flip z
|
||
|
|
||
|
|
||
|
//float flObjDepth = 1.0f - min( vProjCoords.z, 0.99999f ); // Object depth in shadow space
|
||
|
float flObjDepth = min( vProjCoords.z, 0.99999f ); // Object depth in shadow space
|
||
|
|
||
|
// projective distance from z plane in view coords
|
||
|
float4 vDist4 = float4( flObjDepth, flObjDepth, flObjDepth, flObjDepth );
|
||
|
|
||
|
//fraction component of projected coordinates; here FLASHLIGHT_SHADOW_TEXTURE_RESOLUTION represents the shadowmap size
|
||
|
float2 vTexRes = float2( 1408.0f, 1408.0f );
|
||
|
float2 vFrac = frac( vShadowMapCenter * vTexRes );
|
||
|
float4 vWeights = float4( vFrac.x, vFrac.y, 1.0f - vFrac.x, 1.0f - vFrac.y );
|
||
|
|
||
|
float flPercentInLight;
|
||
|
|
||
|
[isolate]
|
||
|
{
|
||
|
float4 vShadowMapVals, vInLight;
|
||
|
asm
|
||
|
{
|
||
|
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
sgt vInLight, vShadowMapVals, vDist4
|
||
|
};
|
||
|
//7LS flipped z sub for above sgt args
|
||
|
//sgt vInLight, vDist4, vShadowMapVals
|
||
|
float4 vShadowMapWeights = float4( vWeights.w, vWeights.z, 1, vWeights.z * vWeights.w );
|
||
|
flPercentInLight = dot( vInLight, vShadowMapWeights );
|
||
|
}
|
||
|
|
||
|
[isolate]
|
||
|
{
|
||
|
float4 vShadowMapVals, vInLight;
|
||
|
asm
|
||
|
{
|
||
|
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = -1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = -2.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
sgt vInLight, vShadowMapVals, vDist4
|
||
|
};
|
||
|
float4 vShadowMapWeights = float4( vWeights.x * vWeights.w, 1, vWeights.x, vWeights.w );
|
||
|
flPercentInLight += dot( vInLight, vShadowMapWeights );
|
||
|
}
|
||
|
|
||
|
[isolate]
|
||
|
{
|
||
|
float4 vShadowMapVals, vInLight;
|
||
|
asm
|
||
|
{
|
||
|
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = -1.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = -2.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
sgt vInLight, vShadowMapVals, vDist4
|
||
|
};
|
||
|
float4 vShadowMapWeights = float4( 1, vWeights.z * vWeights.y, vWeights.y, vWeights.z );
|
||
|
flPercentInLight += dot( vInLight, vShadowMapWeights );
|
||
|
}
|
||
|
|
||
|
[isolate]
|
||
|
{
|
||
|
float4 vShadowMapVals, vInLight;
|
||
|
asm
|
||
|
{
|
||
|
tfetch2D vShadowMapVals.x___, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals._x__, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.__x_, vShadowMapCenter, DepthSampler, OffsetX = 1.0, OffsetY = 1.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
tfetch2D vShadowMapVals.___x, vShadowMapCenter, DepthSampler, OffsetX = 0.0, OffsetY = 0.0, UseComputedLOD=false, UseRegisterLOD=false, MagFilter = point, MinFilter = point
|
||
|
sgt vInLight, vShadowMapVals, vDist4
|
||
|
};
|
||
|
float4 vShadowMapWeights = float4( vWeights.x, vWeights.y, vWeights.x * vWeights.y, 1 );
|
||
|
flPercentInLight += dot( vInLight, vShadowMapWeights );
|
||
|
}
|
||
|
|
||
|
//sum of weights is 9 since border taps are bilinearly filtered
|
||
|
return 1.0f - (( 1.0f / 9.0f ) * flPercentInLight);
|
||
|
}
|
||
|
|
||
|
#elif defined(_PS3)
|
||
|
|
||
|
// keep this in sync with c_env_cascade_light.cpp
|
||
|
#define CASCADE_RESOLUTION 768
|
||
|
|
||
|
// 1 2 1
|
||
|
// 2 4 2
|
||
|
// 1 2 1
|
||
|
// Tweaked for good code gen with the SCE Cg compiler.
|
||
|
half CSMSampleShadowBufferPS33x3( sampler DepthSampler, const float3 shadowMapPos )
|
||
|
{
|
||
|
float fTexelEpsilon = 1.0f / CASCADE_RESOLUTION;
|
||
|
|
||
|
float3 shadowMapCenter_objDepth = shadowMapPos.xyz;
|
||
|
|
||
|
float3 shadowMapCenter = shadowMapCenter_objDepth.xyz; // Center of shadow filter
|
||
|
|
||
|
float4 vUV0 = shadowMapCenter.xyzx + float4( fTexelEpsilon, fTexelEpsilon, 0.0f, -fTexelEpsilon );
|
||
|
float4 vUV1 = shadowMapCenter.xyzx + float4( fTexelEpsilon, -fTexelEpsilon, 0.0f, -fTexelEpsilon );
|
||
|
|
||
|
half4 vOneTaps;
|
||
|
vOneTaps.x = h4tex2D( DepthSampler, vUV0.xyz ).x;
|
||
|
vOneTaps.y = h4tex2D( DepthSampler, vUV0.wyz ).y;
|
||
|
vOneTaps.z = h4tex2D( DepthSampler, vUV1.xyz ).z;
|
||
|
vOneTaps.w = h4tex2D( DepthSampler, vUV1.wyz ).w;
|
||
|
half flSum = dot( vOneTaps, half4(1.0f, 1.0f, 1.0f, 1.0f));
|
||
|
|
||
|
float4 vUV2 = shadowMapCenter.xyzx + float4( fTexelEpsilon, 0.0f, 0.0f, -fTexelEpsilon );
|
||
|
float4 vUV3 = shadowMapCenter.xyzy + float4( 0.0f, -fTexelEpsilon, 0.0f, fTexelEpsilon );
|
||
|
|
||
|
half4 vTwoTaps;
|
||
|
vTwoTaps.x = h4tex2D( DepthSampler, vUV2.xyz ).x;
|
||
|
vTwoTaps.y = h4tex2D( DepthSampler, vUV2.wyz ).y;
|
||
|
vTwoTaps.z = h4tex2D( DepthSampler, vUV3.xyz ).z;
|
||
|
vTwoTaps.w = h4tex2D( DepthSampler, vUV3.xwz ).w;
|
||
|
flSum += dot( vTwoTaps, half4(2.0f, 2.0f, 2.0f, 2.0f));
|
||
|
|
||
|
flSum += tex2D( DepthSampler, shadowMapCenter ).x * half(4.0f);
|
||
|
|
||
|
// Sum all 9 Taps
|
||
|
return flSum * (1.0h / 16.0h);
|
||
|
}
|
||
|
|
||
|
#else
|
||
|
|
||
|
#error Unsupported
|
||
|
|
||
|
#endif // #elif defined(_PS3)
|
||
|
|
||
|
float CSMSampleShadowBuffer1Tap( float2 vPositionLs, float flComparisonDepth )
|
||
|
{
|
||
|
#if defined(_X360)
|
||
|
#if (CSM_VIEWMODELQUALITY == 0)
|
||
|
return CSMSampleShadowBuffer360Simple( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
|
||
|
#else
|
||
|
return CSMSampleShadowBuffer3604x4( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
|
||
|
#endif
|
||
|
#elif defined(_PS3)
|
||
|
#if (CSM_VIEWMODELQUALITY == 0)
|
||
|
return tex2Dproj( CSMDepthAtlasSampler, float4( vPositionLs.x, vPositionLs.y, flComparisonDepth.x, 1.0f ) );
|
||
|
#else
|
||
|
return CSMSampleShadowBufferPS33x3( CSMDepthAtlasSampler, float3( vPositionLs.x, vPositionLs.y, flComparisonDepth ) );
|
||
|
#endif
|
||
|
#else
|
||
|
#error Unsupported
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
float CSMSampleShadowBuffer( float2 vPositionLs, float flComparisonDepth )
|
||
|
{
|
||
|
return CSMSampleShadowBuffer1Tap( vPositionLs, flComparisonDepth );
|
||
|
}
|
||
|
|
||
|
int CSMRangeTestExpanded( float2 vCoords )
|
||
|
{
|
||
|
// Returns true if the coordinates are within [.02,.98] - purposely a little sloppy to prevent the shadow filter kernel from leaking outside the cascade's portion of the atlas.
|
||
|
vCoords = vCoords * ( 1.0f / .96f ) - float2( .02f / .96f, .02f / .96f );
|
||
|
return ( dot( saturate( vCoords.xy ) - vCoords.xy, float2( 1, 1 ) ) == 0.0f );
|
||
|
}
|
||
|
|
||
|
int CSMRangeTestNonExpanded( float2 vCoords )
|
||
|
{
|
||
|
return ( dot( saturate( vCoords.xy ) - vCoords.xy, float2( 1, 1 ) ) == 0.0f );
|
||
|
}
|
||
|
|
||
|
float CSMComputeSplitLerpFactor( float2 vPositionToSampleLs )
|
||
|
{
|
||
|
float2 vSplitLerpFactorTemp = float2( 1.0f, 1.0f ) - saturate( ( abs( vPositionToSampleLs.xy - float2( .5f, .5f ) ) - float2( g_flSunShadowingSplitLerpFactorBase, g_flSunShadowingSplitLerpFactorBase ) ) * float2( g_flSunShadowingSplitLerpFactorInvRange, g_flSunShadowingSplitLerpFactorInvRange ) );
|
||
|
return vSplitLerpFactorTemp.x * vSplitLerpFactorTemp.y;
|
||
|
}
|
||
|
|
||
|
float4 CSMTransformLightToTexture( float4 pos, float4x4 mat )
|
||
|
{
|
||
|
#if defined(_PS3)
|
||
|
return mul( mat, pos );
|
||
|
#else
|
||
|
return mul( pos, mat );
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
#if ( CASCADE_SIZE == 0 )
|
||
|
float CSMComputeShadowing( float3 vPositionWs )
|
||
|
{
|
||
|
return 1.0f;
|
||
|
}
|
||
|
#elif ( CSM_MODE >= 1 )
|
||
|
|
||
|
#error Invalid CSM_MODE
|
||
|
|
||
|
#else
|
||
|
// CSM shader quality level 0 (the only supported level on gameconsole)
|
||
|
float CSMComputeShadowing( float3 vPositionWs )
|
||
|
{
|
||
|
float flShadowScalar = 1.0f;
|
||
|
|
||
|
float4 vPosition4Ws = float4( vPositionWs.xyz, 1.0f );
|
||
|
|
||
|
float3 vPositionToSampleLs = float3( 0.0f, 0.0f, CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[0] ).z );
|
||
|
|
||
|
#if ( CSM_VIEWMODELQUALITY == 0 )
|
||
|
|
||
|
// only consider cascade 1 and 2 for console perf
|
||
|
|
||
|
#if defined(_PS3)
|
||
|
float4 cascadeAtlasUVOffsets_1 = g_vCascadeAtlasUVOffsets[1];
|
||
|
float4 cascadeAtlasUVOffsets_2 = g_vCascadeAtlasUVOffsets[2];
|
||
|
|
||
|
float4 cascadeAtlasUVOffset = cascadeAtlasUVOffsets_1;
|
||
|
#else
|
||
|
int nCascadeIndex = 1;
|
||
|
#endif
|
||
|
|
||
|
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[1] ).xy;
|
||
|
|
||
|
if ( !CSMRangeTestExpanded( vPositionToSampleLs.xy ) )
|
||
|
{
|
||
|
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[2] ).xy;
|
||
|
#if defined(_PS3)
|
||
|
cascadeAtlasUVOffset = cascadeAtlasUVOffsets_2;
|
||
|
#else
|
||
|
nCascadeIndex = 2;
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
#if defined(_PS3)
|
||
|
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * cascadeAtlasUVOffset.zw + cascadeAtlasUVOffset.xy;
|
||
|
#else
|
||
|
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * g_vCascadeAtlasUVOffsets[nCascadeIndex].zw + g_vCascadeAtlasUVOffsets[nCascadeIndex].xy;
|
||
|
#endif
|
||
|
float3 vCamDelta = vPositionWs - g_vCamPosition.xyz;
|
||
|
float flZLerpFactor = saturate( dot( vCamDelta, vCamDelta ) * g_flSunShadowingZLerpFactorRange + g_flSunShadowingZLerpFactorBase );
|
||
|
|
||
|
flShadowScalar = CSMSampleShadowBuffer( vPositionToSampleLs.xy, vPositionToSampleLs.z );
|
||
|
flShadowScalar = lerp( flShadowScalar, 1.0f, flZLerpFactor );
|
||
|
#else
|
||
|
// Viewmodel shadowing
|
||
|
// only use cascade 0 for viewmodel rendering
|
||
|
|
||
|
vPositionToSampleLs.xy = CSMTransformLightToTexture( vPosition4Ws.xyzw, g_matWorldToShadowTexMatrices[0] ).xy;
|
||
|
|
||
|
vPositionToSampleLs.xy = saturate( vPositionToSampleLs.xy ) * g_vCascadeAtlasUVOffsets[0].zw + g_vCascadeAtlasUVOffsets[0].xy;
|
||
|
|
||
|
flShadowScalar = CSMSampleShadowBuffer( vPositionToSampleLs.xy, vPositionToSampleLs.z );
|
||
|
#endif // CSM_VIEWMODELQUALITY == 0
|
||
|
|
||
|
return flShadowScalar;
|
||
|
}
|
||
|
|
||
|
#endif // #if ( CSM_MODE == 0 )
|