2021-07-24 21:11:47 -07:00

4336 lines
146 KiB
C++

//===== Copyright (c) 1996-2008, Valve Corporation, All rights reserved. ======//
//
// Purpose:
//
// $NoKeywords: $
//
//===========================================================================//
#define DISABLE_PROTECTED_THINGS
#include "locald3dtypes.h"
#include "shaderdevicedx8.h"
#include "shaderapi/ishaderutil.h"
#include "shaderapidx8_global.h"
#include "filesystem.h"
#include "tier0/icommandline.h"
#include "tier2/tier2.h"
#include "shadershadowdx8.h"
#include "colorformatdx8.h"
#include "materialsystem/IShader.h"
#include "shaderapidx8.h"
#include "shaderapidx8_global.h"
#include "imeshdx8.h"
#include "materialsystem/materialsystem_config.h"
#include "vertexshaderdx8.h"
#include "recording.h"
#include "vstdlib/ikeyvaluessystem.h"
#include "winutils.h"
#include "tier0/vprof_telemetry.h"
#include "tier0/miniprofiler.h"
#if defined ( DX_TO_GL_ABSTRACTION )
// Placed here so inlines placed in dxabstract.h can access gGL
COpenGLEntryPoints *gGL = NULL;
#endif
#define D3D_BATCH_PERF_ANALYSIS 0
#if D3D_BATCH_PERF_ANALYSIS
#if defined( DX_TO_GL_ABSTRACTION )
#error Cannot enable D3D_BATCH_PERF_ANALYSIS when using DX_TO_GL_ABSTRACTION, use GL_BATCH_PERF_ANALYSIS instead.
#endif
// Define this if you want all d3d9 interfaces hooked and run through the dx9hook.h shim interfaces. For profiling, etc.
#define DO_DX9_HOOK
#endif
#ifdef DO_DX9_HOOK
#if D3D_BATCH_PERF_ANALYSIS
ConVar d3d_batch_vis( "d3d_batch_vis", "0" );
ConVar d3d_batch_vis_abs_scale( "d3d_batch_vis_abs_scale", ".050" );
ConVar d3d_present_vis_abs_scale( "d3d_batch_vis_abs_scale", ".050" );
ConVar d3d_batch_vis_y_scale( "d3d_batch_vis_y_scale", "0.0" );
uint64 g_nTotalD3DCalls, g_nTotalD3DCycles;
static double s_rdtsc_to_ms;
#endif
#include "dx9hook.h"
#endif
#ifndef _X360
#include "wmi.h"
#endif
#if defined( _X360 )
#include "xbox/xbox_console.h"
#include "xbox/xbox_win32stubs.h"
#include "xbox/xbox_launch.h"
#endif
#ifdef _PS3
#include <sys/tty.h>
#include <sysutil/sysutil_sysparam.h>
#include <ps3gcm/gcmstate.h>
#endif
// NOTE: This has to be the last file included!
#include "tier0/memdbgon.h"
// A logging channel used during engine initialization
DEFINE_LOGGING_CHANNEL_NO_TAGS( LOG_EngineInitialization, "EngineInitialization" );
#if defined( _X360 )
#define JUNE_2009_XDK_ISSUES
#endif
//-----------------------------------------------------------------------------
// Globals
//-----------------------------------------------------------------------------
static CShaderDeviceMgrDx8 g_ShaderDeviceMgrDx8;
CShaderDeviceMgrDx8* g_pShaderDeviceMgrDx8 = &g_ShaderDeviceMgrDx8;
#ifndef SHADERAPIDX10
// In the shaderapidx10.dll, we use its version of IShaderDeviceMgr.
EXPOSE_SINGLE_INTERFACE_GLOBALVAR( CShaderDeviceMgrDx8, IShaderDeviceMgr,
SHADER_DEVICE_MGR_INTERFACE_VERSION, g_ShaderDeviceMgrDx8 )
#endif
#if defined( _X360 )
IDirect3D9 *m_pD3D;
#endif
// hook into mat_forcedynamic from the engine.
static ConVar mat_forcedynamic( "mat_forcedynamic", "0", FCVAR_CHEAT );
// Turn this on to record frames that are longer than what CERT requires on the 360.
ConVar mat_spew_long_frames( "mat_spew_long_frames", "0", 0, "warn about frames that go over 66ms for CERT purposes." );
#if defined( _PS3 ) || defined( _OSX )
extern ConVar mat_debugalttab;
#else
// this is hooked into the engines convar
ConVar mat_debugalttab( "mat_debugalttab", "0", FCVAR_CHEAT );
#endif
//-----------------------------------------------------------------------------
//
// Device manager
//
//-----------------------------------------------------------------------------
//-----------------------------------------------------------------------------
// constructor, destructor
//-----------------------------------------------------------------------------
CShaderDeviceMgrDx8::CShaderDeviceMgrDx8()
{
m_pD3D = NULL;
m_bAdapterInfoIntialized = false;
#if defined( PIX_INSTRUMENTATION ) && defined ( DX_TO_GL_ABSTRACTION ) && defined( _WIN32 )
m_hD3D9 = NULL;
m_pBeginEvent = NULL;
m_pEndEvent = NULL;
m_pSetMarker = NULL;
m_pSetOptions = NULL;
#endif
}
CShaderDeviceMgrDx8::~CShaderDeviceMgrDx8()
{
}
#ifdef OSX
#include <Carbon/Carbon.h>
#endif
//-----------------------------------------------------------------------------
// Connect, disconnect
//-----------------------------------------------------------------------------
bool CShaderDeviceMgrDx8::Connect( CreateInterfaceFn factory )
{
LOCK_SHADERAPI();
if ( !BaseClass::Connect( factory ) )
return false;
#if defined ( DX_TO_GL_ABSTRACTION )
gGL = ToGLConnectLibraries( factory );
#endif
#if defined( DO_DX9_HOOK )
m_pD3D = Direct3DCreate9Hook(D3D_SDK_VERSION);
#else
m_pD3D = Direct3DCreate9(D3D_SDK_VERSION);
#endif
if ( !m_pD3D )
{
Warning( "Failed to create D3D9!\n" );
return false;
}
#if defined( PIX_INSTRUMENTATION ) && defined ( DX_TO_GL_ABSTRACTION ) && defined( _WIN32 )
// This is a little odd, but AMD PerfStudio hooks D3D9.DLL and intercepts all of the D3DPERF API's (even for OpenGL apps).
// So dynamically load d3d9.dll and get the address of these exported functions.
if ( !m_hD3D9 )
{
m_hD3D9 = LoadLibraryA("d3d9.dll");
}
if ( m_hD3D9 )
{
Plat_DebugString( "PIX_INSTRUMENTATION: Loaded d3d9.dll\n" );
printf( "PIX_INSTRUMENTATION: Loaded d3d9.dll\n" );
m_pBeginEvent = (D3DPERF_BeginEvent_FuncPtr)GetProcAddress( m_hD3D9, "D3DPERF_BeginEvent" );
m_pEndEvent = (D3DPERF_EndEvent_FuncPtr)GetProcAddress( m_hD3D9, "D3DPERF_EndEvent" );
m_pSetMarker = (D3DPERF_SetMarker_FuncPtr)GetProcAddress( m_hD3D9, "D3DPERF_SetOptions" );
m_pSetOptions = (D3DPERF_SetOptions_FuncPtr)GetProcAddress( m_hD3D9, "D3DPERF_SetMarker" );
}
#endif
// FIXME: Want this to be here, but we can't because Steam
// hasn't had it's application ID set up yet.
// InitAdapterInfo();
return true;
}
void CShaderDeviceMgrDx8::Disconnect()
{
LOCK_SHADERAPI();
#if defined( PIX_INSTRUMENTATION ) && defined ( DX_TO_GL_ABSTRACTION ) && defined( _WIN32 )
if ( m_hD3D9 )
{
m_pBeginEvent = NULL;
m_pEndEvent = NULL;
m_pSetMarker = NULL;
m_pSetOptions = NULL;
FreeLibrary( m_hD3D9 );
m_hD3D9 = NULL;
}
#endif
if ( m_pD3D )
{
m_pD3D->Release();
m_pD3D = 0;
}
#if defined ( DX_TO_GL_ABSTRACTION )
ToGLDisconnectLibraries();
#endif
BaseClass::Disconnect();
}
//-----------------------------------------------------------------------------
// Initialization
//-----------------------------------------------------------------------------
InitReturnVal_t CShaderDeviceMgrDx8::Init( )
{
// FIXME: Remove call to InitAdapterInfo once Steam startup issues are resolved.
// Do it in Connect instead.
InitAdapterInfo();
return INIT_OK;
}
//-----------------------------------------------------------------------------
// Shutdown
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::Shutdown( )
{
LOCK_SHADERAPI();
// FIXME: Make PIX work
// BeginPIXEvent( PIX_VALVE_ORANGE, "Shutdown" );
if ( g_pShaderAPI )
{
g_pShaderAPI->OnDeviceShutdown();
}
if ( g_pShaderDevice )
{
g_pShaderDevice->ShutdownDevice();
g_pMaterialSystemHardwareConfig = NULL;
}
// EndPIXEvent();
}
//-----------------------------------------------------------------------------
// Inline methods
//-----------------------------------------------------------------------------
#if !defined( _GAMECONSOLE )
bool CShaderDeviceDx8::IsActive() const
{
return Dx9Device()->IsActive();
}
#endif
//-----------------------------------------------------------------------------
// Initialize adapter information
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::InitAdapterInfo()
{
if ( m_bAdapterInfoIntialized )
return;
m_bAdapterInfoIntialized = true;
m_Adapters.RemoveAll();
int nCount = m_pD3D->GetAdapterCount( );
for( int i = 0; i < nCount; ++i )
{
int j = m_Adapters.AddToTail();
AdapterInfo_t &info = m_Adapters[j];
#ifdef _DEBUG
memset( &info.m_ActualCaps, 0xDD, sizeof(info.m_ActualCaps) );
#endif
info.m_ActualCaps.m_bDeviceOk = ComputeCapsFromD3D( &info.m_ActualCaps, i );
if ( !info.m_ActualCaps.m_bDeviceOk )
continue;
ReadDXSupportLevels( info.m_ActualCaps );
// Read dxsupport.cfg which has config overrides for particular cards.
ReadHardwareCaps( info.m_ActualCaps, info.m_ActualCaps.m_nMaxDXSupportLevel );
// What's in "-shader" overrides dxsupport.cfg
const char *pShaderParam = CommandLine()->ParmValue( "-shader" );
if ( pShaderParam )
{
Q_strncpy( info.m_ActualCaps.m_pShaderDLL, pShaderParam, sizeof( info.m_ActualCaps.m_pShaderDLL ) );
}
}
}
//--------------------------------------------------------------------------------
// Code to detect support for texture border color (widely supported but the caps
// bit is messed up in drivers due to a stupid WHQL test that requires this to work
// with float textures which we don't generally care about wrt this address mode)
//--------------------------------------------------------------------------------
void CShaderDeviceMgrDx8::CheckBorderColorSupport( HardwareCaps_t *pCaps, int nAdapter )
{
#ifdef DX_TO_GL_ABSTRACTION
if( true )
#else
if( IsX360() )
#endif
{
pCaps->m_bSupportsBorderColor = true;
}
else // Most PC parts do this, but let's not deal with that yet (JasonM)
{
pCaps->m_bSupportsBorderColor = false;
}
}
//--------------------------------------------------------------------------------
// Vendor-dependent code to detect support for various flavors of shadow mapping
//--------------------------------------------------------------------------------
void CShaderDeviceMgrDx8::CheckVendorDependentShadowMappingSupport( HardwareCaps_t *pCaps, int nAdapter )
{
// Set a default null texture format...may be overridden below by IHV-specific surface type
pCaps->m_NullTextureFormat = IMAGE_FORMAT_ARGB8888;
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_RENDERTARGET, D3DRTYPE_TEXTURE, D3DFMT_R5G6B5 ) == S_OK )
{
pCaps->m_NullTextureFormat = IMAGE_FORMAT_RGB565;
}
#if defined( _X360 )
//pCaps->m_ShadowDepthTextureFormat = ReverseDepthOnX360() ? IMAGE_FORMAT_X360_DST24F : IMAGE_FORMAT_X360_DST24;
pCaps->m_ShadowDepthTextureFormat = ReverseDepthOnX360() ? IMAGE_FORMAT_D24FS8 : IMAGE_FORMAT_D24S8;
pCaps->m_bSupportsShadowDepthTextures = true;
pCaps->m_bSupportsFetch4 = false;
pCaps->m_HighPrecisionShadowDepthTextureFormat = pCaps->m_ShadowDepthTextureFormat;
return;
#elif defined ( _PS3 )
pCaps->m_NullTextureFormat = IMAGE_FORMAT_ARGB8888;
if ( CommandLine()->CheckParm( "-d24shadowbuffer" ) )
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24S8;
}
else
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D16;
}
pCaps->m_bSupportsShadowDepthTextures = true;
pCaps->m_bSupportsFetch4 = false;
pCaps->m_HighPrecisionShadowDepthTextureFormat = pCaps->m_ShadowDepthTextureFormat;
return;
#elif defined ( DX_TO_GL_ABSTRACTION )
// We may want to only do this on the higher-end Mac SKUs, since it's not free...
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D16_SHADOW; // This format shunts us down the right shader combo path
pCaps->m_bSupportsShadowDepthTextures = true;
pCaps->m_bSupportsFetch4 = false;
pCaps->m_HighPrecisionShadowDepthTextureFormat = pCaps->m_ShadowDepthTextureFormat;
return;
#endif
if ( IsPC() )
{
bool bToolsMode = IsPlatformWindows() && ( CommandLine()->CheckParm( "-tools" ) != NULL );
if ( ( pCaps->m_VendorID == VENDORID_NVIDIA ) && ( pCaps->m_SupportsShaderModel_3_0 ) ) // ps_3_0 parts from nVidia
{
// First, test for null texture support
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_RENDERTARGET, D3DRTYPE_TEXTURE, NVFMT_NULL ) == S_OK )
{
pCaps->m_NullTextureFormat = IMAGE_FORMAT_NULL;
}
//
// NVIDIA has two no-PCF formats (these are not filtering modes, but surface formats
// NVFMT_RAWZ is supported by NV4x (not supported here yet...requires a dp3 to reconstruct in shader code, which doesn't seem to work)
// NVFMT_INTZ is supported on newer chips as of G8x (just read like ATI non-fetch4 mode)
//
/*
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_RENDERTARGET, D3DRTYPE_TEXTURE, NVFMT_INTZ ) == S_OK )
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_NV_INTZ;
pCaps->m_bSupportsFetch4 = false;
pCaps->m_bSupportsShadowDepthTextures = true;
return;
}
*/
bool bSupports16Bit = ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, D3DFMT_D16 ) == S_OK );
bool bSupports24Bit = ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, D3DFMT_D24S8 ) == S_OK );
if ( bSupports24Bit || bSupports16Bit )
{
pCaps->m_bSupportsFetch4 = false;
pCaps->m_bSupportsShadowDepthTextures = true;
// Prefer 16-bit
if ( bSupports16Bit )
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D16_SHADOW;
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D16_SHADOW;
if ( bSupports24Bit )
{
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
if ( bToolsMode)
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
}
}
}
else
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
}
return;
}
}
else if ( ( pCaps->m_VendorID == VENDORID_ATI ) && pCaps->m_SupportsPixelShaders_2_b ) // ps_2_b parts from ATI
{
// Initially, check for Fetch4 (tied to ATIFMT_D24S8 support)
pCaps->m_bSupportsFetch4 = false;
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, ATIFMT_D24S8 ) == S_OK )
{
pCaps->m_bSupportsFetch4 = true;
}
// ATI prefers the NVIDIA PCF path on their DX10 parts:
// http://developer.amd.com/gpu_assets/Advanced%20DX9%20Capabilities%20for%20ATI%20Radeon%20Cards_v2.pdf
if ( !CommandLine()->CheckParm( "-forceatifetch4" ) )
{
if ( pCaps->m_bDX10Card )
{
pCaps->m_bSupportsFetch4 = false;
}
}
bool bSupports16Bit = ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, ATIFMT_D16 ) == S_OK );
bool bSupports24Bit = ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, ATIFMT_D24S8 ) == S_OK );
if ( bSupports24Bit || bSupports16Bit )
{
pCaps->m_bSupportsShadowDepthTextures = true;
// Prefer 16-bit
if ( bSupports16Bit )
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D16_SHADOW;
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D16_SHADOW;
if ( bSupports24Bit )
{
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
if ( bToolsMode)
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
}
}
}
else
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
pCaps->m_HighPrecisionShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
}
return;
}
}
else if ( ( pCaps->m_VendorID == VENDORID_INTEL ) && pCaps->m_SupportsPixelShaders_2_b ) // ps_2_b parts from INTEL
{
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE, D3DFMT_D24S8 ) == S_OK )
{
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_D24X8_SHADOW;
pCaps->m_bSupportsFetch4 = false;
pCaps->m_bSupportsShadowDepthTextures = true;
return;
}
}
}
// Other vendor or old hardware
pCaps->m_ShadowDepthTextureFormat = IMAGE_FORMAT_UNKNOWN;
pCaps->m_bSupportsShadowDepthTextures = false;
pCaps->m_bSupportsFetch4 = false;
}
//-----------------------------------------------------------------------------
// Vendor-dependent code to detect Alpha To Coverage Backdoors
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::CheckVendorDependentAlphaToCoverage( HardwareCaps_t *pCaps, int nAdapter )
{
pCaps->m_bSupportsAlphaToCoverage = false;
// Bail out on OpenGL
#ifdef DX_TO_GL_ABSTRACTION
pCaps->m_bSupportsAlphaToCoverage = true;
pCaps->m_AlphaToCoverageEnableValue = TRUE;
pCaps->m_AlphaToCoverageDisableValue = FALSE;
pCaps->m_AlphaToCoverageState = D3DRS_ADAPTIVETESS_Y; // Just match the NVIDIA state hackery
return;
#endif
#ifdef _X360
{
pCaps->m_bSupportsAlphaToCoverage = true;
pCaps->m_AlphaToCoverageEnableValue = TRUE;
pCaps->m_AlphaToCoverageDisableValue = FALSE;
pCaps->m_AlphaToCoverageState = D3DRS_ALPHATOMASKENABLE;
return;
}
#endif // _X360
if ( pCaps->m_VendorID == VENDORID_NVIDIA )
{
// nVidia has two modes...assume SSAA is superior to MSAA and hence more desirable (though it's probably not)
//
// Currently, they only seem to expose any of this on 7800 and up though older parts certainly
// support at least the MSAA mode since they support it on OpenGL via the arb_multisample extension
bool bNVIDIA_MSAA = false;
bool bNVIDIA_SSAA = false;
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, // Check MSAA version
D3DFMT_X8R8G8B8, 0, D3DRTYPE_SURFACE,
(D3DFORMAT)MAKEFOURCC('A', 'T', 'O', 'C')) == S_OK )
{
bNVIDIA_MSAA = true;
}
if ( m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, // Check SSAA version
D3DFMT_X8R8G8B8, 0, D3DRTYPE_SURFACE,
(D3DFORMAT)MAKEFOURCC('S', 'S', 'A', 'A')) == S_OK )
{
bNVIDIA_SSAA = true;
}
// nVidia pitches SSAA but we prefer ATOC
if ( bNVIDIA_MSAA )// || bNVIDIA_SSAA )
{
// if ( bNVIDIA_SSAA )
// m_AlphaToCoverageEnableValue = MAKEFOURCC('S', 'S', 'A', 'A');
// else
pCaps->m_AlphaToCoverageEnableValue = MAKEFOURCC('A', 'T', 'O', 'C');
pCaps->m_AlphaToCoverageState = D3DRS_ADAPTIVETESS_Y;
pCaps->m_AlphaToCoverageDisableValue = (DWORD)D3DFMT_UNKNOWN;
pCaps->m_bSupportsAlphaToCoverage = true;
return;
}
}
else if ( pCaps->m_VendorID == VENDORID_ATI )
{
// Supported on all ATI parts...just go ahead and set the state when appropriate
pCaps->m_AlphaToCoverageState = D3DRS_POINTSIZE;
pCaps->m_AlphaToCoverageEnableValue = MAKEFOURCC('A','2','M','1');
pCaps->m_AlphaToCoverageDisableValue = MAKEFOURCC('A','2','M','0');
pCaps->m_bSupportsAlphaToCoverage = true;
return;
}
}
//-----------------------------------------------------------------------------
// Vendor-dependent code to detect support for optimal depth buffer rt resolve
//-----------------------------------------------------------------------------
#define FOURCC_RESZ ((D3DFORMAT)(MAKEFOURCC('R','E','S','Z')))
#define FOURCC_INTZ ((D3DFORMAT)(MAKEFOURCC('I','N','T','Z')))
void CShaderDeviceMgrDx8::CheckVendorDependentDepthResolveSupport( HardwareCaps_t *pCaps, int nAdapter )
{
// Bail out on OpenGL
#ifdef DX_TO_GL_ABSTRACTION
pCaps->m_bSupportsRESZ = false;
pCaps->m_bSupportsINTZ = false;
#endif
HRESULT hr;
hr = m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8,//D3DFMT_D24S8,
D3DUSAGE_RENDERTARGET, D3DRTYPE_SURFACE,
FOURCC_RESZ );
pCaps->m_bSupportsRESZ = (hr == D3D_OK);
Msg( "RESZ %sSUPPORTED!\n", pCaps->m_bSupportsRESZ ? "" : "NOT " );
hr = m_pD3D->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8,
D3DUSAGE_DEPTHSTENCIL, D3DRTYPE_TEXTURE,
FOURCC_INTZ );
pCaps->m_bSupportsINTZ = (hr == D3D_OK);
Msg( "INTZ %sSUPPORTED!\n", pCaps->m_bSupportsINTZ ? "" : "NOT " );
}
ConVar mat_hdr_level( "mat_hdr_level", "2" );
#if defined( _PS3 )
#define SHADOWMAP_SLOPESCALEDEPTHBIAS_D24 "5"
#define SHADOWMAP_DEPTHBIAS_D24 "2500"
#define SHADOWMAP_SLOPESCALEDEPTHBIAS "2"
#define SHADOWMAP_DEPTHBIAS ".25"
#elif defined( DX_TO_GL_ABSTRACTION )
#define SHADOWMAP_SLOPESCALEDEPTHBIAS "8"
#define SHADOWMAP_DEPTHBIAS "20"
#elif defined ( _X360 )
#define SHADOWMAP_SLOPESCALEDEPTHBIAS "2.15"
#define SHADOWMAP_DEPTHBIAS ".000032"
#else
#define SHADOWMAP_SLOPESCALEDEPTHBIAS "3"
#define SHADOWMAP_DEPTHBIAS ".000025"
#endif
ConVar mat_slopescaledepthbias_shadowmap( "mat_slopescaledepthbias_shadowmap", SHADOWMAP_SLOPESCALEDEPTHBIAS, FCVAR_NONE );
ConVar mat_depthbias_shadowmap( "mat_depthbias_shadowmap", SHADOWMAP_DEPTHBIAS, FCVAR_NONE );
// For testing Fast Clip
ConVar mat_fastclip( "mat_fastclip", "0", FCVAR_CHEAT );
//-----------------------------------------------------------------------------
// Determine capabilities
//-----------------------------------------------------------------------------
bool CShaderDeviceMgrDx8::ComputeCapsFromD3D( HardwareCaps_t *pCaps, int nAdapter )
{
D3DCAPS caps;
D3DADAPTER_IDENTIFIER9 ident;
HRESULT hr;
// NOTE: When getting the caps, we want to be limited by the hardware
// even if we're running with software T&L...
hr = m_pD3D->GetDeviceCaps( nAdapter, DX8_DEVTYPE, &caps );
if ( FAILED( hr ) )
return false;
hr = m_pD3D->GetAdapterIdentifier( nAdapter, D3DENUM_WHQL_LEVEL, &ident );
if ( FAILED( hr ) )
return false;
if ( IsOpenGL() )
{
if ( !ident.DeviceId && !ident.VendorId )
{
ident.DeviceId = 1;
ident.VendorId = 1;
}
}
// Make sure mac users do not fake their graphic cards and bypass the mandatory
// CSMs for high end GPUs
#ifndef OSX
// Intended for debugging only
if ( CommandLine()->CheckParm( "-force_device_id" ) )
{
const char *pDevID = CommandLine()->ParmValue( "-force_device_id", "" );
if ( pDevID )
{
int nDevID = V_atoi( pDevID ); // use V_atoi for hex support
if ( nDevID > 0 )
{
ident.DeviceId = nDevID;
}
}
}
// Intended for debugging only
if ( CommandLine()->CheckParm( "-force_vendor_id" ) )
{
const char *pVendorID = CommandLine()->ParmValue( "-force_vendor_id", "" );
if ( pVendorID )
{
int nVendorID = V_atoi( pVendorID ); // use V_atoi for hex support
if ( pVendorID > 0 )
{
ident.VendorId = nVendorID;
}
}
}
#endif
Q_strncpy( pCaps->m_pDriverName, ident.Description, MATERIAL_ADAPTER_NAME_LENGTH );
pCaps->m_VendorID = ident.VendorId;
pCaps->m_DeviceID = ident.DeviceId;
pCaps->m_SubSysID = ident.SubSysId;
pCaps->m_Revision = ident.Revision;
pCaps->m_nDriverVersionHigh = ident.DriverVersion.HighPart;
pCaps->m_nDriverVersionLow = ident.DriverVersion.LowPart;
pCaps->m_pShaderDLL[0] = 0;
pCaps->m_nMaxViewports = 1;
pCaps->m_PreferDynamicTextures = ( caps.Caps2 & D3DCAPS2_DYNAMICTEXTURES ) ? 1 : 0;
pCaps->m_HasSetDeviceGammaRamp = (caps.Caps2 & D3DCAPS2_CANCALIBRATEGAMMA) != 0;
Assert( ((caps.VertexShaderVersion >> 8) & 0xFF) >= 1 );
Assert( ((caps.PixelShaderVersion >> 8) & 0xFF) >= 1 );
pCaps->m_bScissorSupported = ( caps.RasterCaps & D3DPRASTERCAPS_SCISSORTEST ) != 0;
#if defined( DX8_COMPATABILITY_MODE )
pCaps->m_SupportsPixelShaders_2_b = false;
pCaps->m_SupportsShaderModel_3_0 = false;
pCaps->m_SupportsMipmappedCubemaps = false;
#else
Assert( ( caps.PixelShaderVersion & 0xffff ) >= 0x0200 );
pCaps->m_SupportsPixelShaders_2_b = ( ( caps.PixelShaderVersion & 0xffff ) >= 0x0200) && (caps.PS20Caps.NumInstructionSlots >= 512); // More caps to this, but this will do
Assert( ( caps.VertexShaderVersion & 0xffff ) >= 0x0200 );
pCaps->m_SupportsShaderModel_3_0 = ( caps.PixelShaderVersion & 0xffff ) >= 0x0300;
pCaps->m_SupportsMipmappedCubemaps = ( caps.TextureCaps & D3DPTEXTURECAPS_MIPCUBEMAP ) ? true : false;
#endif
if ( IsOpenGL() )
{
pCaps->m_SupportsShaderModel_3_0 = true;
}
#if 0
// Slam 3.0 shaders off for Intel
// Don't do this anymore on CS:GO because we require shader model 3.0, and there are Intel chipsets with decent SM3 support now.
if ( pCaps->m_VendorID == VENDORID_INTEL )
{
pCaps->m_SupportsShaderModel_3_0 = false;
}
#endif
pCaps->m_MaxVertexShader30InstructionSlots = 0;
pCaps->m_MaxPixelShader30InstructionSlots = 0;
if ( pCaps->m_SupportsShaderModel_3_0 )
{
pCaps->m_MaxVertexShader30InstructionSlots = caps.MaxVertexShader30InstructionSlots;
pCaps->m_MaxPixelShader30InstructionSlots = caps.MaxPixelShader30InstructionSlots;
}
pCaps->m_bSoftwareVertexProcessing = false;
if ( IsPlatformWindows() && CommandLine()->CheckParm( "-mat_softwaretl" ) )
{
pCaps->m_bSoftwareVertexProcessing = true;
}
if ( IsPlatformWindows() && !( caps.DevCaps & D3DDEVCAPS_HWTRANSFORMANDLIGHT ) )
{
// no hardware t&l. . use software
pCaps->m_bSoftwareVertexProcessing = true;
}
// Set mat_forcedynamic if software vertex processing since the software vp pipe has
// problems with sparse vertex buffers (it transforms the whole thing.)
if ( pCaps->m_bSoftwareVertexProcessing )
{
mat_forcedynamic.SetValue( 1 );
}
#ifdef _PS3
pCaps->m_bSupportsStaticControlFlow = true;
#elif defined DX_TO_GL_ABSTRACTION
// On OSX, we can force ourselves down a static control flow path, but this only works with GLSL
if ( IsOSX() )
{
pCaps->m_bSupportsStaticControlFlow = CommandLine()->CheckParm("-glslcontrolflow") != NULL;
}
else
{
pCaps->m_bSupportsStaticControlFlow = !CommandLine()->CheckParm("-noglslcontrolflow");
}
#else
pCaps->m_bSupportsStaticControlFlow = true;
#endif
// NOTE: Texture stages is a fixed-function concept
// NOTE: Normally, the number of texture units == the number of texture
// stages except for NVidia hardware, which reports more stages than units.
// The reason for this is because they expose the inner hardware pixel
// pipeline through the extra stages. The only thing we use stages for
// in the hardware is for configuring the color + alpha args + ops.
pCaps->m_NumSamplers = caps.MaxSimultaneousTextures;
pCaps->m_NumSamplers = 16;
// Clamp
pCaps->m_NumSamplers = MIN( pCaps->m_NumSamplers, MAX_SAMPLERS );
pCaps->m_SupportsCompressedTextures = COMPRESSED_TEXTURES_ON;
pCaps->m_bSupportsAnisotropicFiltering = (caps.TextureFilterCaps & D3DPTFILTERCAPS_MINFANISOTROPIC) != 0;
pCaps->m_bSupportsMagAnisotropicFiltering = (caps.TextureFilterCaps & D3DPTFILTERCAPS_MAGFANISOTROPIC) != 0;
pCaps->m_nMaxAnisotropy = pCaps->m_bSupportsAnisotropicFiltering ? caps.MaxAnisotropy : 1;
Assert( caps.TextureCaps & D3DPTEXTURECAPS_CUBEMAP );
Assert( !( caps.TextureCaps & D3DPTEXTURECAPS_POW2 ) || ( caps.TextureCaps & D3DPTEXTURECAPS_NONPOW2CONDITIONAL ) );
Assert( caps.TextureCaps & D3DPTEXTURECAPS_PROJECTED );
if ( pCaps->m_bSoftwareVertexProcessing )
{
// This should be pushed down based on pixel shaders.
pCaps->m_NumVertexShaderConstants = 256;
pCaps->m_NumBooleanVertexShaderConstants = 16; // 2.0 parts have 16 bool vs registers
pCaps->m_NumBooleanPixelShaderConstants = 16; // 2.0 parts have 16 bool ps registers
pCaps->m_NumIntegerVertexShaderConstants = 16; // 2.0 parts have 16 bool vs registers
pCaps->m_NumIntegerPixelShaderConstants = 16; // 2.0 parts have 16 bool ps registers
}
else
{
pCaps->m_NumVertexShaderConstants = caps.MaxVertexShaderConst;
if ( CommandLine()->FindParm( "-limitvsconst" ) )
{
pCaps->m_NumVertexShaderConstants = MIN( 256, pCaps->m_NumVertexShaderConstants );
}
pCaps->m_NumBooleanVertexShaderConstants = 16; // 2.0 parts have 16 bool vs registers
pCaps->m_NumBooleanPixelShaderConstants = 16; // 2.0 parts have 16 bool ps registers
// This is a little misleading...this is really 16 int4 registers
pCaps->m_NumIntegerVertexShaderConstants = 16; // 2.0 parts have 16 bool vs registers
pCaps->m_NumIntegerPixelShaderConstants = 16; // 2.0 parts have 16 bool ps registers
}
if ( IsX360() )
{
// NOTE! This is really 224, but we do an optimization that only blasts the first 32 always.
if ( IsGPUOwnSupported() )
{
pCaps->m_NumPixelShaderConstants = 32;
}
else
{
pCaps->m_NumPixelShaderConstants = 224;
}
}
else if ( IsPS3() )
{
pCaps->m_NumVertexShaderConstants = 256;
#if defined( _PS3 )
pCaps->m_NumPixelShaderConstants = MAX_FRAGMENT_PROGRAM_CONSTS; // this is somewhat of a lie... fragment shader constants are special on PS3 and we actually have a larger number of these
#endif
pCaps->m_NumIntegerVertexShaderConstants = pCaps->m_NumIntegerPixelShaderConstants = 0;
pCaps->m_NumBooleanVertexShaderConstants = 32;
pCaps->m_NumBooleanPixelShaderConstants = 0;
}
else
{
if ( pCaps->m_SupportsShaderModel_3_0 )
{
pCaps->m_NumPixelShaderConstants = 224;
}
else
{
pCaps->m_NumPixelShaderConstants = 32;
}
}
pCaps->m_MaxNumLights = caps.MaxActiveLights;
if ( pCaps->m_MaxNumLights > MAX_NUM_LIGHTS )
{
pCaps->m_MaxNumLights = MAX_NUM_LIGHTS;
}
// Set according to control flow bit on OpenGL
if ( IsOpenGL() )
{
pCaps->m_MaxNumLights = pCaps->m_bSupportsStaticControlFlow ? 4 : 2;
}
if ( pCaps->m_bSoftwareVertexProcessing )
{
pCaps->m_MaxNumLights = 2;
}
pCaps->m_MaxTextureWidth = caps.MaxTextureWidth;
pCaps->m_MaxTextureHeight = caps.MaxTextureHeight;
pCaps->m_MaxTextureDepth = caps.MaxVolumeExtent ? caps.MaxVolumeExtent : 1;
pCaps->m_MaxTextureAspectRatio = caps.MaxTextureAspectRatio;
if ( pCaps->m_MaxTextureAspectRatio == 0 )
{
pCaps->m_MaxTextureAspectRatio = MAX( pCaps->m_MaxTextureWidth, pCaps->m_MaxTextureHeight);
}
pCaps->m_MaxPrimitiveCount = caps.MaxPrimitiveCount;
pCaps->m_bNeedsATICentroidHack = false;
pCaps->m_bDisableShaderOptimizations = false;
pCaps->m_bPreferZPrepass = IsPS3(); // turn on ZPass on PS/3 by default
pCaps->m_bSuppressPixelShaderCentroidHackFixup = false;
pCaps->m_bPreferTexturesInHWMemory = true;
pCaps->m_bPreferHardwareSync = IsPC();
pCaps->m_bUnsupported = false;
// Check if ZBias and SlopeScaleDepthBias are supported. .if not, tweak the projection matrix instead
// for polyoffset.
pCaps->m_ZBiasAndSlopeScaledDepthBiasSupported =
( ( caps.RasterCaps & D3DPRASTERCAPS_DEPTHBIAS) != 0 ) &&
( ( caps.RasterCaps & D3DPRASTERCAPS_SLOPESCALEDEPTHBIAS ) != 0 );
if ( IsX360() )
{
// driver lies, force it
pCaps->m_ZBiasAndSlopeScaledDepthBiasSupported = true;
}
// How many user clip planes?
pCaps->m_MaxUserClipPlanes = caps.MaxUserClipPlanes;
if ( CommandLine()->CheckParm( "-nouserclip" ) /* || (IsOSXOpenGL() && (!CommandLine()->FindParm("-glslmode"))) || r_emulategl.GetBool() */ )
{
// rbarris 03Feb10: this now ignores POSIX / -glslmode / r_emulategl because we're defaulting GLSL mode "on".
// so this will mean that the engine will always ask for user clip planes.
// this will misbehave under ARB mode, since ARB shaders won't respect that state.
// it's difficult to make this fluid without teaching the engine about a cap that could change during run.
pCaps->m_MaxUserClipPlanes = 0;
}
if ( pCaps->m_MaxUserClipPlanes > MAXUSERCLIPPLANES )
{
pCaps->m_MaxUserClipPlanes = MAXUSERCLIPPLANES;
}
pCaps->m_FakeSRGBWrite = false;
pCaps->m_CanDoSRGBReadFromRTs = true;
pCaps->m_bSupportsGLMixedSizeTargets = false;
#ifdef DX_TO_GL_ABSTRACTION
// using #if because we're referencing fields in the RHS which don't exist in Windows headers for the caps9 struct
pCaps->m_FakeSRGBWrite = caps.FakeSRGBWrite != 0;
pCaps->m_CanDoSRGBReadFromRTs = caps.CanDoSRGBReadFromRTs != 0;
pCaps->m_bSupportsGLMixedSizeTargets = caps.MixedSizeTargets != 0;
#endif
// Query for SRGB support as needed for our DX 9 stuff
if ( IsPC() || !IsX360() )
{
pCaps->m_SupportsSRGB = ( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_SRGBREAD, D3DRTYPE_TEXTURE, D3DFMT_DXT1 ) == S_OK);
if ( pCaps->m_SupportsSRGB )
{
pCaps->m_SupportsSRGB = ( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_SRGBREAD | D3DUSAGE_QUERY_SRGBWRITE, D3DRTYPE_TEXTURE, D3DFMT_A8R8G8B8 ) == S_OK);
}
}
else
{
// 360 does support it, but is queried in the wrong manner, so force it
pCaps->m_SupportsSRGB = true;
}
if ( CommandLine()->CheckParm( "-nosrgb" ) )
{
pCaps->m_SupportsSRGB = false;
}
if ( IsOpenGL() )
{
// HACK HACK: A lot of code in various branches assumes vertex texture support == SM3, so we're going to set that to true in GL mode and just set m_nVertexTextureCount to 0.
pCaps->m_bSupportsVertexTextures = true;
pCaps->m_NumVertexSamplers = 0;
}
else
{
pCaps->m_bSupportsVertexTextures = ( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE, D3DFMT_X8R8G8B8,
D3DUSAGE_QUERY_VERTEXTEXTURE, D3DRTYPE_TEXTURE, D3DFMT_R32F ) == S_OK );
// FIXME: vs30 has a fixed setting here at 4.
// Future hardware will need some other way of computing this.
pCaps->m_NumVertexSamplers = pCaps->m_bSupportsVertexTextures ? 4 : 0;
}
// FIXME: How do I actually compute this?
pCaps->m_nMaxVertexTextureDimension = pCaps->m_bSupportsVertexTextures ? 4096 : 0;
// Does the device support filterable int16 textures?
bool bSupportsInteger16Textures =
( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE,
D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_FILTER,
D3DRTYPE_TEXTURE, D3DFMT_A16B16G16R16 ) == S_OK );
// Does the device support filterable fp16 textures?
bool bSupportsFloat16Textures =
( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE,
D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_FILTER,
D3DRTYPE_TEXTURE, D3DFMT_A16B16G16R16F ) == S_OK );
// Does the device support blendable fp16 render targets?
bool bSupportsFloat16RenderTargets =
( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE,
D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_POSTPIXELSHADER_BLENDING | D3DUSAGE_RENDERTARGET,
D3DRTYPE_TEXTURE, D3DFMT_A16B16G16R16F ) == S_OK );
// Essentially a proxy for a DX10 device running DX9 code path
pCaps->m_bSupportsFloat32RenderTargets = ( D3D()->CheckDeviceFormat( nAdapter, DX8_DEVTYPE,
D3DFMT_X8R8G8B8, D3DUSAGE_QUERY_POSTPIXELSHADER_BLENDING | D3DUSAGE_RENDERTARGET,
D3DRTYPE_TEXTURE, D3DFMT_A32B32G32R32F ) == S_OK );
pCaps->m_bFogColorSpecifiedInLinearSpace = false;
pCaps->m_bFogColorAlwaysLinearSpace = false;
// Assume not DX10. Check below.
pCaps->m_bDX10Card = false;
pCaps->m_bDX10Blending = false;
if ( IsOpenGL() )
{
if ( ( pCaps->m_VendorID <= 1 ) && ( pCaps->m_DeviceID <= 1 ) )
{
// HACK HACK - need to fix this once we get proper vendor/device ID's
pCaps->m_bFogColorAlwaysLinearSpace = true;
pCaps->m_bDX10Card = true;
pCaps->m_bDX10Blending = true;
}
}
if ( IsPC() && pCaps->m_SupportsSRGB )
{
if ( pCaps->m_VendorID == VENDORID_NVIDIA )
{
// NVidia wants fog color to be specified in linear space
pCaps->m_bFogColorSpecifiedInLinearSpace = true;
if ( IsOpenGL() )
{
// If we're not the Quadro 4500 or GeForce 7x000, we're an NVIDIA DX10 part on MacOS
if ( !( (pCaps->m_DeviceID == 0x009d) || ( (pCaps->m_DeviceID >= 0x0391) && (pCaps->m_DeviceID <= 0x0395) ) ) )
{
pCaps->m_bFogColorAlwaysLinearSpace = true;
pCaps->m_bDX10Card = true;
pCaps->m_bDX10Blending = true;
}
}
else
{
// On G80 and later, always specify in linear space
if ( pCaps->m_bSupportsFloat32RenderTargets )
{
pCaps->m_bFogColorAlwaysLinearSpace = true;
pCaps->m_bDX10Card = true;
pCaps->m_bDX10Blending = true;
}
}
}
else if ( pCaps->m_VendorID == VENDORID_ATI )
{
if ( IsOpenGL() )
{
// If we're not a Radeon X1x00 (device IDs in this range), we're a DX10 chip
if ( !( (pCaps->m_DeviceID >= 0x7109) && (pCaps->m_DeviceID <= 0x7291) ) )
{
pCaps->m_bFogColorSpecifiedInLinearSpace = true;
pCaps->m_bFogColorAlwaysLinearSpace = true;
pCaps->m_bDX10Card = true;
pCaps->m_bDX10Blending = true;
}
}
else
{
// Check for DX10 part
pCaps->m_bDX10Card = pCaps->m_SupportsShaderModel_3_0 &&
( pCaps->m_MaxVertexShader30InstructionSlots > 1024 ) &&
( pCaps->m_MaxPixelShader30InstructionSlots > 512 ) ;
// On ATI, DX10 card means DX10 blending
pCaps->m_bDX10Blending = pCaps->m_bDX10Card;
if( pCaps->m_bDX10Blending )
{
pCaps->m_bFogColorSpecifiedInLinearSpace = true;
pCaps->m_bFogColorAlwaysLinearSpace = true;
}
}
}
else if ( pCaps->m_VendorID == VENDORID_INTEL )
{
// Intel does not have performant vertex textures
pCaps->m_bDX10Card = false;
bool bPostBlendSRGBConvert = true;
// The source for these PCI IDs for Intel GPUs is the mesa driver source code:
// https://cgit.freedesktop.org/mesa/mesa/tree/include/pci_ids
// We are here detecting i915 (Gen3). Anything else is Gen4+ which supports DX10
switch ( pCaps->m_DeviceID )
{
// From https://cgit.freedesktop.org/mesa/mesa/tree/include/pci_ids/i915_pci_ids.h
case 0x3577: //Intel(R) 830M
case 0x2562: //Intel(R) 845G
case 0x3582: //Intel(R) 852GM/855GM
case 0x2572: //Intel(R) 865G
case 0x2582: //Intel(R) 915G
case 0x258A: //Intel(R) E7221G (i915)
case 0x2592: //Intel(R) 915GM
case 0x2772: //Intel(R) 945G
case 0x27A2: //Intel(R) 945GM
case 0x27AE: //Intel(R) 945GME
case 0x29B2: //Intel(R) Q35
case 0x29C2: //Intel(R) G33
case 0x29D2: //Intel(R) Q33
case 0xA011: //Intel(R) Pineview M
case 0xA001: //Intel(R) Pineview
bPostBlendSRGBConvert = false;
break;
}
pCaps->m_bDX10Blending = bPostBlendSRGBConvert;
if( pCaps->m_bDX10Blending )
{
pCaps->m_bFogColorSpecifiedInLinearSpace = true;
pCaps->m_bFogColorAlwaysLinearSpace = true;
}
}
}
// Do we have everything necessary to run with integer HDR? Note that
// even if we don't support integer 16-bit/component textures, we
// can still run in this mode if fp16 textures are supported.
bool bSupportsIntegerHDR =
// (caps.Caps3 & D3DCAPS3_ALPHA_FULLSCREEN_FLIP_OR_DISCARD) &&
// (caps.PrimitiveMiscCaps & D3DPMISCCAPS_SEPARATEALPHABLEND) &&
( bSupportsInteger16Textures || bSupportsFloat16Textures ) &&
pCaps->m_SupportsSRGB;
// Do we have everything necessary to run with float HDR?
bool bSupportsFloatHDR = pCaps->m_SupportsShaderModel_3_0 &&
// (caps.Caps3 & D3DCAPS3_ALPHA_FULLSCREEN_FLIP_OR_DISCARD) &&
// (caps.PrimitiveMiscCaps & D3DPMISCCAPS_SEPARATEALPHABLEND) &&
bSupportsFloat16Textures &&
bSupportsFloat16RenderTargets &&
pCaps->m_SupportsSRGB &&
!IsX360();
pCaps->m_MaxHDRType = HDR_TYPE_NONE;
if ( bSupportsFloatHDR )
pCaps->m_MaxHDRType = HDR_TYPE_FLOAT;
else
if ( bSupportsIntegerHDR )
pCaps->m_MaxHDRType = HDR_TYPE_INTEGER;
if ( bSupportsFloatHDR && ( mat_hdr_level.GetInt() == 3 ) )
{
pCaps->m_HDRType = HDR_TYPE_FLOAT;
}
else if ( bSupportsIntegerHDR )
{
pCaps->m_HDRType = HDR_TYPE_INTEGER;
}
else
{
pCaps->m_HDRType = HDR_TYPE_NONE;
}
Assert( caps.MaxStreams > 1 );
pCaps->m_bSupportsStreamOffset = ( caps.DevCaps2 & D3DDEVCAPS2_STREAMOFFSET );
pCaps->m_flMinGammaControlPoint = 0.0f;
pCaps->m_flMaxGammaControlPoint = 65535.0f;
pCaps->m_nGammaControlPointCount = 256;
// Compute the effective DX support level based on all the other caps
ComputeDXSupportLevel( *pCaps );
pCaps->m_nDXSupportLevel = pCaps->m_nMaxDXSupportLevel;
int nModelIndex = VERTEX_SHADER_MODEL;
pCaps->m_MaxVertexShaderBlendMatrices = (pCaps->m_NumVertexShaderConstants - nModelIndex) / 3;
if ( pCaps->m_MaxVertexShaderBlendMatrices > NUM_MODEL_TRANSFORMS )
{
pCaps->m_MaxVertexShaderBlendMatrices = NUM_MODEL_TRANSFORMS;
}
CheckBorderColorSupport( pCaps, nAdapter );
// This may get more complex if we start using multiple flavors of compressed vertex - for now it's "on or off"
pCaps->m_SupportsCompressedVertices = VERTEX_COMPRESSION_ON;
#if !defined( _GAMECONSOLE ) // Disabling vertex compression for Portal 2 to help PS3 perf
if ( CommandLine()->CheckParm( "-no_compressed_verts" ) )
#endif
{
pCaps->m_SupportsCompressedVertices = VERTEX_COMPRESSION_NONE;
}
// Various vendor-dependent checks...
CheckVendorDependentAlphaToCoverage( pCaps, nAdapter );
CheckVendorDependentShadowMappingSupport( pCaps, nAdapter );
CheckVendorDependentDepthResolveSupport( pCaps, nAdapter );
// Cascaded shadow mapping
// Note: dxsupport can only DISABLE CSM support, not enable it.
pCaps->m_nCSMQuality = CSMQUALITY_VERY_LOW;
pCaps->m_bSupportsCascadedShadowMapping = pCaps->m_bSupportsShadowDepthTextures;
// If we're not on a 3.0 part, these values are more appropriate (X800 & X850 parts from ATI do shadow mapping but not 3.0 )
if ( !IsOpenGL() )
{
if ( !pCaps->m_SupportsShaderModel_3_0 )
{
mat_slopescaledepthbias_shadowmap.SetValue( 5.9f );
mat_depthbias_shadowmap.SetValue( 0.003f );
}
}
#if defined( _PS3 )
if ( CommandLine()->CheckParm( "-d24shadowbuffer" ) )
{
// Slam in larger depth bias settings if we're using D24 shadow buffering (only used for comparison/profiling purposes).
mat_slopescaledepthbias_shadowmap.SetValue( SHADOWMAP_SLOPESCALEDEPTHBIAS_D24 );
mat_depthbias_shadowmap.SetValue( SHADOWMAP_DEPTHBIAS_D24 );
}
#endif
if( pCaps->m_MaxUserClipPlanes == 0 )
{
pCaps->m_UseFastClipping = true;
}
pCaps->m_MaxSimultaneousRenderTargets = caps.NumSimultaneousRTs;
return true;
}
//-----------------------------------------------------------------------------
// Compute the effective DX support level based on all the other caps
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::ComputeDXSupportLevel( HardwareCaps_t &caps )
{
// NOTE: Support level is actually DX level * 10 + subversion
// So, 70 = DX7, 80 = DX8, 81 = DX8 w/ 1.4 pixel shaders
// 90 = DX9 w/ 2.0 pixel shaders
// 92 = DX9 w/ 2.0b pixel shaders
// 95 = DX9 w/ 3.0 pixel shaders and vertex textures
// 98 = DX9 XBox360
// 100 = DX10 (but running on XP, using the DX9 API)
// NOTE: 82 = NVidia nv3x cards, which can't run dx9 fast
// FIXME: Improve this!! There should be a whole list of features
// we require in order to be considered a DX7 board, DX8 board, etc.
if ( IsX360() )
{
caps.m_nMinDXSupportLevel = 98;
caps.m_nMaxDXSupportLevel = 98;
return;
}
#if !defined( CSTRIKE15 )
if ( caps.m_bDX10Card ) // Note that we don't tie vertex textures to 30 shaders anymore
{
caps.m_nMinDXSupportLevel = 92;
caps.m_nMaxDXSupportLevel = 100;
return;
}
#endif
if ( caps.m_SupportsShaderModel_3_0 ) // Note that we don't tie vertex textures to 30 shaders anymore
{
caps.m_nMinDXSupportLevel = 90;
caps.m_nMaxDXSupportLevel = 95;
return;
}
if ( caps.m_SupportsPixelShaders_2_b )
{
caps.m_nMinDXSupportLevel = 90;
caps.m_nMaxDXSupportLevel = 92;
return;
}
// NOTE: sRGB is currently required for dx90 because it isn't doing
// gamma correctly if that feature doesn't exist
if ( caps.m_SupportsSRGB )
{
caps.m_nMinDXSupportLevel = 90;
caps.m_nMaxDXSupportLevel = 90;
return;
}
Assert( 0 );
// we don't support this!
caps.m_nMinDXSupportLevel = 90;
caps.m_nMaxDXSupportLevel = 90;
}
//-----------------------------------------------------------------------------
// Gets the number of adapters...
//-----------------------------------------------------------------------------
int CShaderDeviceMgrDx8::GetAdapterCount() const
{
// FIXME: Remove call to InitAdapterInfo once Steam startup issues are resolved.
const_cast<CShaderDeviceMgrDx8*>( this )->InitAdapterInfo();
return m_Adapters.Count();
}
//-----------------------------------------------------------------------------
// Returns info about each adapter
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::GetAdapterInfo( int nAdapter, MaterialAdapterInfo_t& info ) const
{
// FIXME: Remove call to InitAdapterInfo once Steam startup issues are resolved.
const_cast<CShaderDeviceMgrDx8*>( this )->InitAdapterInfo();
Assert( ( nAdapter >= 0 ) && ( nAdapter < m_Adapters.Count() ) );
const HardwareCaps_t &caps = m_Adapters[ nAdapter ].m_ActualCaps;
memcpy( &info, &caps, sizeof(MaterialAdapterInfo_t) );
}
//-----------------------------------------------------------------------------
// Sets the adapter
//-----------------------------------------------------------------------------
bool CShaderDeviceMgrDx8::SetAdapter( int nAdapter, int nAdapterFlags )
{
LOCK_SHADERAPI();
// FIXME:
// g_pShaderDeviceDx8->m_bReadPixelsEnabled = (nAdapterFlags & MATERIAL_INIT_READ_PIXELS_ENABLED) != 0;
// Set up hardware information for this adapter...
g_pShaderDeviceDx8->m_DeviceType = (nAdapterFlags & MATERIAL_INIT_REFERENCE_RASTERIZER) ?
D3DDEVTYPE_REF : D3DDEVTYPE_HAL;
g_pShaderDeviceDx8->m_DisplayAdapter = nAdapter;
if ( g_pShaderDeviceDx8->m_DisplayAdapter >= (UINT)GetAdapterCount() )
{
g_pShaderDeviceDx8->m_DisplayAdapter = 0;
}
#ifdef NVPERFHUD
// hack for nvperfhud
g_pShaderDeviceDx8->m_DisplayAdapter = m_pD3D->GetAdapterCount() - 1;
g_pShaderDeviceDx8->m_DeviceType = D3DDEVTYPE_REF;
#endif
// backward compat
if ( !g_pShaderDeviceDx8->OnAdapterSet() )
return false;
// if ( !g_pShaderDeviceDx8->Init() )
// {
// Warning( "Unable to initialize dx8 device!\n" );
// return false;
// }
g_pShaderDevice = g_pShaderDeviceDx8;
return true;
}
//-----------------------------------------------------------------------------
// Returns the screen resolution
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::GetDesktopResolution( int *pWidth, int *pHeight, int nAdapter ) const
{
#if defined ( _X360 )
#elif defined ( DX_TO_GL_ABSTRACTION )
D3DDISPLAYMODE d3dDisplayMode;
m_pD3D->GetAdapterDisplayMode( nAdapter, &d3dDisplayMode );
*pWidth = d3dDisplayMode.Width;
*pHeight = d3dDisplayMode.Height;
#elif defined( _X360 ) || defined( _PS3 ) || defined( POSIX )
// Empty
#else
HMONITOR hMonitor = m_pD3D->GetAdapterMonitor( nAdapter );
// *pWidth = ::GetDeviceCaps( hMonitor, HORZSIZE );
// *pHeight = ::GetDeviceCaps( hMonitor, VERTSIZE );
MONITORINFO monitorInfo;
memset( &monitorInfo, 0, sizeof(monitorInfo) );
monitorInfo.cbSize = sizeof(monitorInfo);
GetMonitorInfo( hMonitor, &monitorInfo );
*pWidth = monitorInfo.rcMonitor.right - monitorInfo.rcMonitor.left;
*pHeight = monitorInfo.rcMonitor.bottom - monitorInfo.rcMonitor.top;
#endif
}
//-----------------------------------------------------------------------------
// Returns the number of modes
//-----------------------------------------------------------------------------
int CShaderDeviceMgrDx8::GetModeCount( int nAdapter ) const
{
LOCK_SHADERAPI();
Assert( m_pD3D && (nAdapter < GetAdapterCount() ) );
#if !defined( _X360 )
// fixme - what format should I use here?
return m_pD3D->GetAdapterModeCount( nAdapter, D3DFMT_X8R8G8B8 );
#else
return 1; // Only one mode, which is the current mode set in the 360 dashboard. Going to fill it in with exactly what the 360 is set to.
#endif
}
#ifdef _PS3
static void PS3_GetVideoOutResolution( int *pWidth, int *pHeight, float *pAspectRatio )
{
*pWidth = 640;
*pHeight = 480;
CellVideoOutState videoOutState;
int ret = cellVideoOutGetState( CELL_VIDEO_OUT_PRIMARY, 0, &videoOutState);
if ( ret < CELL_OK )
return;
CellVideoOutResolution resolution;
ret = cellVideoOutGetResolution( videoOutState.displayMode.resolutionId, &resolution );
if ( ret < CELL_OK )
return;
*pWidth = resolution.width;
*pHeight = resolution.height;
#ifndef _CERT
static bool s_bPrintOnce = false;
if ( !s_bPrintOnce )
{
s_bPrintOnce = true;
char chDbg[512];
Q_snprintf( chDbg, sizeof( chDbg ),
"----- VIDEO MODE -----\n"
"STATE: %s\n"
"COLOR: %s\n"
"RES: %u x %u [#%d]\n"
"ASPECT: %s\n"
"RRATE: %s%s%s%s\n"
"SCAN: %s\n"
"----------------------\n",
(videoOutState.state == CELL_VIDEO_OUT_OUTPUT_STATE_ENABLED) ? "ENABLED" : "NOT READY",
(videoOutState.colorSpace == CELL_VIDEO_OUT_COLOR_SPACE_RGB) ? "RGB" : ( (videoOutState.colorSpace == CELL_VIDEO_OUT_COLOR_SPACE_YUV) ? "YUV" : "UNDEFINED" ),
resolution.width, resolution.height, videoOutState.displayMode.resolutionId,
(videoOutState.displayMode.aspect == CELL_VIDEO_OUT_ASPECT_4_3) ? "4x3" : ( (videoOutState.displayMode.aspect == CELL_VIDEO_OUT_ASPECT_16_9) ? "16x9" : "AUTO" ),
(videoOutState.displayMode.refreshRates & CELL_VIDEO_OUT_REFRESH_RATE_30HZ) ? " 30Hz" : "",
(videoOutState.displayMode.refreshRates & CELL_VIDEO_OUT_REFRESH_RATE_50HZ) ? " 50Hz" : "",
(videoOutState.displayMode.refreshRates & CELL_VIDEO_OUT_REFRESH_RATE_60HZ) ? " 60Hz" : "",
(videoOutState.displayMode.refreshRates & CELL_VIDEO_OUT_REFRESH_RATE_59_94HZ) ? " 59.94Hz" : "",
videoOutState.displayMode.scanMode ? "PROGRESSIVE" : "INTERLACED"
);
unsigned int dummy;
sys_tty_write( SYS_TTYP15, chDbg, Q_strlen( chDbg ), &dummy );
}
#endif
// Clamp 1080p resolution down to 720p
if ( resolution.height >= 720 && CommandLine()->FindParm( "-480p" ) )
{
*pWidth = 640;
*pHeight = 480;
}
else if ( resolution.height >= 1080 && !CommandLine()->FindParm( "-1080p" ) )
{
*pWidth = 1280;
*pHeight = 720;
}
switch ( videoOutState.displayMode.aspect )
{
case CELL_VIDEO_OUT_ASPECT_4_3:
*pAspectRatio = 4.0f/3.0f;
break;
case CELL_VIDEO_OUT_ASPECT_16_9:
*pAspectRatio = 16.0f/9.0f;
break;
default:
*pAspectRatio = float( *pWidth ) / float( *pHeight );
break;
}
}
#endif // _PS3
//-----------------------------------------------------------------------------
// Returns mode information..
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::GetModeInfo( ShaderDisplayMode_t* pInfo, int nAdapter, int nMode ) const
{
Assert( pInfo->m_nVersion == SHADER_DISPLAY_MODE_VERSION );
LOCK_SHADERAPI();
Assert( m_pD3D && (nAdapter < GetAdapterCount() ) );
Assert( nMode < GetModeCount( nAdapter ) );
#if defined( _PS3 )
PS3_GetVideoOutResolution( &pInfo->m_nWidth, &pInfo->m_nHeight, &pInfo->m_flAspectRatio );
pInfo->m_Format = ImageLoader::D3DFormatToImageFormat( D3DFMT_X8R8G8B8 );
pInfo->m_nRefreshRateNumerator = 60;
pInfo->m_nRefreshRateDenominator = 1;
#elif defined( _X360 )
pInfo->m_Format = ImageLoader::D3DFormatToImageFormat( D3DFMT_X8R8G8B8 );
pInfo->m_nRefreshRateNumerator = 60;
pInfo->m_nRefreshRateDenominator = 1;
pInfo->m_nWidth = GetSystemMetrics( SM_CXSCREEN );
pInfo->m_nHeight = GetSystemMetrics( SM_CYSCREEN );
#else
HRESULT hr;
D3DDISPLAYMODE d3dInfo;
// fixme - what format should I use here?
hr = D3D()->EnumAdapterModes( nAdapter, D3DFMT_X8R8G8B8, nMode, &d3dInfo );
Assert( !FAILED(hr) );
pInfo->m_nWidth = d3dInfo.Width;
pInfo->m_nHeight = d3dInfo.Height;
pInfo->m_Format = ImageLoader::D3DFormatToImageFormat( d3dInfo.Format );
pInfo->m_nRefreshRateNumerator = d3dInfo.RefreshRate;
pInfo->m_nRefreshRateDenominator = 1;
#endif
}
//-----------------------------------------------------------------------------
// Returns the current mode information for an adapter
//-----------------------------------------------------------------------------
void CShaderDeviceMgrDx8::GetCurrentModeInfo( ShaderDisplayMode_t* pInfo, int nAdapter ) const
{
Assert( pInfo->m_nVersion == SHADER_DISPLAY_MODE_VERSION );
LOCK_SHADERAPI();
Assert( D3D() );
HRESULT hr;
D3DDISPLAYMODE mode;
#if defined( _PS3 )
PS3_GetVideoOutResolution( ( int *)&mode.Width, ( int *)&mode.Height, &pInfo->m_flAspectRatio );
mode.Format = D3DFMT_X8R8G8B8;
mode.RefreshRate = 60;
#elif defined( _X360 )
if ( !m_pD3DDevice )
{
// the console has no prior display or mode until its created
mode.Width = GetSystemMetrics( SM_CXSCREEN );
mode.Height = GetSystemMetrics( SM_CYSCREEN );
mode.RefreshRate = 60;
mode.Format = D3DFMT_X8R8G8B8;
}
else
{
hr = m_pD3DDevice->GetDisplayMode( 0, &mode );
Assert( !FAILED(hr) );
}
#else
hr = D3D()->GetAdapterDisplayMode( nAdapter, &mode );
Assert( !FAILED(hr) );
#endif
pInfo->m_nWidth = mode.Width;
pInfo->m_nHeight = mode.Height;
pInfo->m_Format = ImageLoader::D3DFormatToImageFormat( mode.Format );
pInfo->m_nRefreshRateNumerator = mode.RefreshRate;
pInfo->m_nRefreshRateDenominator = 1;
}
//-----------------------------------------------------------------------------
// Sets the video mode
//-----------------------------------------------------------------------------
CreateInterfaceFn CShaderDeviceMgrDx8::SetMode( void *hWnd, int nAdapter, const ShaderDeviceInfo_t& mode )
{
LOCK_SHADERAPI();
Assert( nAdapter < GetAdapterCount() );
int nDXLevel = mode.m_nDXLevel != 0 ? mode.m_nDXLevel : m_Adapters[nAdapter].m_ActualCaps.m_nDXSupportLevel;
if ( nDXLevel > m_Adapters[nAdapter].m_ActualCaps.m_nMaxDXSupportLevel )
{
nDXLevel = m_Adapters[nAdapter].m_ActualCaps.m_nMaxDXSupportLevel;
}
nDXLevel = GetClosestActualDXLevel( nDXLevel );
if ( nDXLevel > 100 )
return NULL;
bool bReacquireResourcesNeeded = false;
if ( g_pShaderDevice )
{
bReacquireResourcesNeeded = IsPC();
g_pShaderDevice->ReleaseResources();
}
if ( g_pShaderAPI )
{
g_pShaderAPI->OnDeviceShutdown();
g_pShaderAPI = NULL;
}
if ( g_pShaderDevice )
{
g_pShaderDevice->ShutdownDevice();
g_pShaderDevice = NULL;
}
g_pShaderShadow = NULL;
ShaderDeviceInfo_t adjustedMode = mode;
adjustedMode.m_nDXLevel = nDXLevel;
if ( !g_pShaderDeviceDx8->InitDevice( hWnd, nAdapter, adjustedMode ) )
return NULL;
if ( !g_pShaderAPIDX8->OnDeviceInit() )
return NULL;
g_pShaderDevice = g_pShaderDeviceDx8;
g_pShaderAPI = g_pShaderAPIDX8;
g_pShaderShadow = g_pShaderShadowDx8;
if ( bReacquireResourcesNeeded )
{
g_pShaderDevice->ReacquireResources();
}
return ShaderInterfaceFactory;
}
//-----------------------------------------------------------------------------
// Validates the mode...
//-----------------------------------------------------------------------------
bool CShaderDeviceMgrDx8::ValidateMode( int nAdapter, const ShaderDeviceInfo_t &info ) const
{
if ( nAdapter >= (int)D3D()->GetAdapterCount() )
return false;
ShaderDisplayMode_t displayMode;
GetCurrentModeInfo( &displayMode, nAdapter );
if ( info.m_bWindowed )
{
// make sure the window fits within the current video mode
if ( ( info.m_DisplayMode.m_nWidth > displayMode.m_nWidth ) ||
( info.m_DisplayMode.m_nHeight > displayMode.m_nHeight ) )
return false;
}
// Make sure the image format requested is valid
ImageFormat backBufferFormat = FindNearestSupportedBackBufferFormat( nAdapter,
DX8_DEVTYPE, displayMode.m_Format, info.m_DisplayMode.m_Format, info.m_bWindowed );
return ( backBufferFormat != IMAGE_FORMAT_UNKNOWN );
}
//-----------------------------------------------------------------------------
// Returns the amount of video memory in bytes for a particular adapter
//-----------------------------------------------------------------------------
int CShaderDeviceMgrDx8::GetVidMemBytes( int nAdapter ) const
{
#if defined( _X360 )
return 256*1024*1024;
#elif defined (DX_TO_GL_ABSTRACTION)
D3DADAPTER_IDENTIFIER9 devIndentifier;
D3D()->GetAdapterIdentifier( nAdapter, D3DENUM_WHQL_LEVEL, &devIndentifier );
return devIndentifier.VideoMemory;
#else
// FIXME: This currently ignores the adapter
return ::GetVidMemBytes();
#endif
}
//-----------------------------------------------------------------------------
//
// Shader device
//
//-----------------------------------------------------------------------------
#if 0
// FIXME: Enable after I've separated it out from shaderapidx8 a little better
static CShaderDeviceDx8 s_ShaderDeviceDX8;
CShaderDeviceDx8* g_pShaderDeviceDx8 = &s_ShaderDeviceDX8;
#endif
#if defined( _GAMECONSOLE )
IDirect3DDevice *m_pD3DDevice;
#endif
//-----------------------------------------------------------------------------
// Constructor, destructor
//-----------------------------------------------------------------------------
CShaderDeviceDx8::CShaderDeviceDx8()
{
m_pD3DDevice = NULL;
for ( int i = 0; i < ARRAYSIZE(m_pFrameSyncQueryObject); i++ )
{
m_pFrameSyncQueryObject[i] = NULL;
m_bQueryIssued[i] = false;
}
m_pFrameSyncTexture = NULL;
m_bQueuedDeviceLost = false;
m_DeviceState = DEVICE_STATE_OK;
m_bOtherAppInitializing = false;
m_IsResizing = false;
m_bPendingVideoModeChange = false;
m_DeviceSupportsCreateQuery = -1;
m_bUsingStencil = false;
m_bResourcesReleased = false;
m_iStencilBufferBits = 0;
m_NonInteractiveRefresh.m_Mode = MATERIAL_NON_INTERACTIVE_MODE_NONE;
m_NonInteractiveRefresh.m_pVertexShader = NULL;
m_NonInteractiveRefresh.m_pPixelShader = NULL;
m_NonInteractiveRefresh.m_pPixelShaderStartup = NULL;
m_NonInteractiveRefresh.m_pPixelShaderStartupPass2 = NULL;
m_NonInteractiveRefresh.m_pVertexDecl = NULL;
m_NonInteractiveRefresh.m_nPacifierFrame = 0;
m_numReleaseResourcesRefCount = 0;
}
CShaderDeviceDx8::~CShaderDeviceDx8()
{
}
//-----------------------------------------------------------------------------
// Computes device creation paramters
//-----------------------------------------------------------------------------
static DWORD ComputeDeviceCreationFlags( D3DCAPS& caps, bool bSoftwareVertexProcessing )
{
// Find out what type of device to make
bool bPureDeviceSupported = (caps.DevCaps & D3DDEVCAPS_PUREDEVICE) != 0;
DWORD nDeviceCreationFlags;
if ( !bSoftwareVertexProcessing )
{
nDeviceCreationFlags = D3DCREATE_HARDWARE_VERTEXPROCESSING;
if ( bPureDeviceSupported )
{
nDeviceCreationFlags |= D3DCREATE_PUREDEVICE;
}
}
else
{
nDeviceCreationFlags = D3DCREATE_SOFTWARE_VERTEXPROCESSING;
}
nDeviceCreationFlags |= D3DCREATE_FPU_PRESERVE;
#ifdef _X360
nDeviceCreationFlags |= D3DCREATE_BUFFER_2_FRAMES;
#endif
return nDeviceCreationFlags;
}
//-----------------------------------------------------------------------------
// Computes the supersample flags
//-----------------------------------------------------------------------------
D3DMULTISAMPLE_TYPE CShaderDeviceDx8::ComputeMultisampleType( int nSampleCount )
{
switch (nSampleCount)
{
#if !defined( _X360 )
case 2: return D3DMULTISAMPLE_2_SAMPLES;
case 3: return D3DMULTISAMPLE_3_SAMPLES;
case 4: return D3DMULTISAMPLE_4_SAMPLES;
case 5: return D3DMULTISAMPLE_5_SAMPLES;
case 6: return D3DMULTISAMPLE_6_SAMPLES;
case 7: return D3DMULTISAMPLE_7_SAMPLES;
case 8: return D3DMULTISAMPLE_8_SAMPLES;
case 9: return D3DMULTISAMPLE_9_SAMPLES;
case 10: return D3DMULTISAMPLE_10_SAMPLES;
case 11: return D3DMULTISAMPLE_11_SAMPLES;
case 12: return D3DMULTISAMPLE_12_SAMPLES;
case 13: return D3DMULTISAMPLE_13_SAMPLES;
case 14: return D3DMULTISAMPLE_14_SAMPLES;
case 15: return D3DMULTISAMPLE_15_SAMPLES;
case 16: return D3DMULTISAMPLE_16_SAMPLES;
#else
case 2: return D3DMULTISAMPLE_2_SAMPLES;
case 4: return D3DMULTISAMPLE_4_SAMPLES;
#endif
default:
case 0:
case 1:
return D3DMULTISAMPLE_NONE;
}
}
void CShaderDeviceDx8::CalcBackBufferDimensions( const ShaderDisplayMode_t &mode, const ShaderDeviceInfo_t &info, int *pBackBufferWidth, int *pBackBufferHeight )
{
if ( IsX360() || !info.m_bWindowed )
{
// fullscreen
bool useDefault = ( info.m_DisplayMode.m_nWidth == 0 ) || ( info.m_DisplayMode.m_nHeight == 0 );
*pBackBufferWidth = useDefault ? mode.m_nWidth : info.m_DisplayMode.m_nWidth;
*pBackBufferHeight = useDefault ? mode.m_nHeight : info.m_DisplayMode.m_nHeight;
}
else
{
// windowed
if ( info.m_bResizing )
{
if ( info.m_bLimitWindowedSize &&
( info.m_nWindowedSizeLimitWidth < mode.m_nWidth || info.m_nWindowedSizeLimitHeight < mode.m_nHeight ) )
{
// When using material system in windowed resizing apps, it's
// sometimes not a good idea to allocate stuff as big as the screen
// video cards can soo run out of resources
*pBackBufferWidth = info.m_nWindowedSizeLimitWidth;
*pBackBufferHeight = info.m_nWindowedSizeLimitHeight;
}
else
{
// When in resizing windowed mode,
// we want to allocate enough memory to deal with any resizing...
*pBackBufferWidth = mode.m_nWidth;
*pBackBufferHeight = mode.m_nHeight;
}
}
else
{
*pBackBufferWidth = info.m_DisplayMode.m_nWidth;
*pBackBufferHeight = info.m_DisplayMode.m_nHeight;
}
}
}
//-----------------------------------------------------------------------------
// Sets the present parameters
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::SetPresentParameters( void* hWnd, int nAdapter, const ShaderDeviceInfo_t &info, bool bSetSymbolsOnly )
{
ShaderDisplayMode_t mode;
g_pShaderDeviceMgr->GetCurrentModeInfo( &mode, nAdapter );
int backBufferWidth = 0;
int backBufferHeight = 0;
CalcBackBufferDimensions( mode, info, &backBufferWidth, &backBufferHeight );
m_AspectRatioInfo.m_flFrameBufferAspectRatio = ( float )backBufferWidth / ( float )backBufferHeight;
m_AspectRatioInfo.m_flPhysicalAspectRatio = m_AspectRatioInfo.m_flFrameBufferAspectRatio;
m_AspectRatioInfo.m_flFrameBuffertoPhysicalScalar = 1.0f;
#ifdef _PS3
// Device physical aspect ratio / framebuffer pixel aspect ratio.
m_AspectRatioInfo.m_flPhysicalAspectRatio = mode.m_flAspectRatio;
m_AspectRatioInfo.m_flFrameBuffertoPhysicalScalar = m_AspectRatioInfo.m_flPhysicalAspectRatio / m_AspectRatioInfo.m_flFrameBufferAspectRatio;
#endif
m_AspectRatioInfo.m_flPhysicalToFrameBufferScalar = 1.0f / m_AspectRatioInfo.m_flFrameBuffertoPhysicalScalar;
m_AspectRatioInfo.m_bIsWidescreen = ( m_AspectRatioInfo.m_flPhysicalAspectRatio >= 1.5999f );
if ( IsGameConsole () )
{
m_AspectRatioInfo.m_bIsHidef = backBufferHeight > 480;
}
else
{
m_AspectRatioInfo.m_bIsHidef = backBufferHeight >= 720;
}
#ifdef DX_TO_GL_ABSTRACTION
{
m_AspectRatioInfo.m_bIsHidef = backBufferHeight >= 640;
}
#endif
m_AspectRatioInfo.m_bInitialized = true;
// Set kv conditional
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "WIN32WIDE", IsGameConsole() ? false : m_AspectRatioInfo.m_bIsWidescreen );
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "WIN32HIDEF", IsGameConsole() ? false : m_AspectRatioInfo.m_bIsHidef );
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "WIN32LODEF", IsGameConsole() ? false : !m_AspectRatioInfo.m_bIsHidef );
#if defined( _X360 )
XVIDEO_MODE videoMode;
XGetVideoMode( &videoMode );
m_AspectRatioInfo.m_bIsWidescreen = videoMode.fIsWideScreen != 0;
#endif
// Set kv conditional
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "GAMECONSOLEWIDE", IsGameConsole() ? m_AspectRatioInfo.m_bIsWidescreen : false );
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "GAMECONSOLEHIDEF", IsGameConsole() ? m_AspectRatioInfo.m_bIsHidef : false );
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "GAMECONSOLELODEF", IsGameConsole() ? !m_AspectRatioInfo.m_bIsHidef : false );
// UI needs to layout differently for lowdef anamorphic widescreen on PS3 since we don't have square pixels there, ie:
// 720x480 widescreen
// 720x576 widescreen
KeyValuesSystem()->SetKeyValuesExpressionSymbol( "ANAMORPHIC", IsPlatformPS3() && m_AspectRatioInfo.m_bIsWidescreen && ( backBufferWidth == 720 ) );
#if defined( _X360 )
// Commented out and using presentation interval to clamp to 30fps
//
// // want 30 for 60Hz, and 25 for 50Hz (PAL)
// int nNewFpsMax = ( ( int )( videoMode.RefreshRate + 0.5f ) ) >> 1;
// // slam to either 30 or 25 so that we don't end up with any other cases.
// if( nNewFpsMax < 26 )
// {
// nNewFpsMax = 25;
// }
// else
// {
// nNewFpsMax = 30;
// }
// DevMsg( "*******Monitor refresh is %f, setting fps_max to %d*********\n", videoMode.RefreshRate, nNewFpsMax );
// ConVarRef fps_max( "fps_max" );
// fps_max.SetValue( nNewFpsMax );
#endif
#ifdef _GAMECONSOLE
// This could probably be removed, but since we are changing fps_max above, I don't want to change the behavior.
// force these to resolve now, other systems at startup will peek at them
g_pCVar->ProcessQueuedMaterialThreadConVarSets();
#endif
if ( bSetSymbolsOnly )
{
// affect no state, just update KV symbols
return;
}
HRESULT hr;
ZeroMemory( &m_PresentParameters, sizeof( m_PresentParameters ) );
m_PresentParameters.Windowed = info.m_bWindowed;
m_PresentParameters.SwapEffect = info.m_bUsingMultipleWindows ? D3DSWAPEFFECT_COPY : D3DSWAPEFFECT_DISCARD;
// for 360, we want to create it ourselves for hierarchical z support
m_PresentParameters.EnableAutoDepthStencil = IsX360() ? FALSE : TRUE;
// What back-buffer format should we use?
ImageFormat backBufferFormat = FindNearestSupportedBackBufferFormat( nAdapter,
DX8_DEVTYPE, m_AdapterFormat, info.m_DisplayMode.m_Format, info.m_bWindowed );
// What depth format should we use?
m_bUsingStencil = info.m_bUseStencil;
if ( info.m_nDXLevel >= 80 )
{
// always stencil for dx9/hdr
m_bUsingStencil = true;
}
#if defined( _X360 )
D3DFORMAT nDepthFormat = ReverseDepthOnX360() ? D3DFMT_D24FS8 : D3DFMT_D24S8;
#else
D3DFORMAT nDepthFormat = m_bUsingStencil ? D3DFMT_D24S8 : D3DFMT_D24X8;
#endif
m_PresentParameters.AutoDepthStencilFormat = FindNearestSupportedDepthFormat(
nAdapter, m_AdapterFormat, backBufferFormat, nDepthFormat );
m_PresentParameters.hDeviceWindow = (VD3DHWND)hWnd;
// store how many stencil buffer bits we have available with the depth/stencil buffer
switch( m_PresentParameters.AutoDepthStencilFormat )
{
case D3DFMT_D24S8:
m_iStencilBufferBits = 8;
break;
#if defined( _X360 )
case D3DFMT_D24FS8:
m_iStencilBufferBits = 8;
break;
#else
case D3DFMT_D24X4S4:
m_iStencilBufferBits = 4;
break;
case D3DFMT_D15S1:
m_iStencilBufferBits = 1;
break;
#endif
default:
m_iStencilBufferBits = 0;
m_bUsingStencil = false; //couldn't acquire a stencil buffer
};
if ( IsX360() || !info.m_bWindowed ) // if fullscreen
{
bool useDefault = ( info.m_DisplayMode.m_nWidth == 0 ) || ( info.m_DisplayMode.m_nHeight == 0 );
m_PresentParameters.BackBufferWidth = useDefault ? mode.m_nWidth : info.m_DisplayMode.m_nWidth;
m_PresentParameters.BackBufferHeight = useDefault ? mode.m_nHeight : info.m_DisplayMode.m_nHeight;
m_PresentParameters.BackBufferFormat = ImageLoader::ImageFormatToD3DFormat( backBufferFormat );
#if defined( _X360 )
m_PresentParameters.FrontBufferFormat = D3DFMT_LE_X8R8G8B8;
#endif
if ( !info.m_bWaitForVSync || CommandLine()->FindParm( "-forcenovsync" ) )
{
// Not vsync'd so only double buffer
m_PresentParameters.BackBufferCount = 1;
m_PresentParameters.PresentationInterval = D3DPRESENT_INTERVAL_IMMEDIATE;
}
else
{
// We are vsync'd and fullscreen, so allow triple buffering
static ConVarRef mat_triplebuffered( "mat_triplebuffered" );
m_PresentParameters.BackBufferCount = mat_triplebuffered.GetInt() ? 2 : 1;
#if defined( _X360 )
m_PresentParameters.PresentationInterval = D3DPRESENT_INTERVAL_TWO;
#else
m_PresentParameters.PresentationInterval = D3DPRESENT_INTERVAL_ONE; // this is temporary until it's correctly defined on the PS3
#endif
}
m_PresentParameters.FullScreen_RefreshRateInHz = info.m_DisplayMode.m_nRefreshRateDenominator ?
info.m_DisplayMode.m_nRefreshRateNumerator / info.m_DisplayMode.m_nRefreshRateDenominator : D3DPRESENT_RATE_DEFAULT;
#if defined( _X360 )
// setup hardware scaling - should be native 720p upsampling to 1080i
if ( info.m_bScaleToOutputResolution )
{
m_PresentParameters.VideoScalerParameters.ScalerSourceRect.x2 = m_PresentParameters.BackBufferWidth;
m_PresentParameters.VideoScalerParameters.ScalerSourceRect.y2 = m_PresentParameters.BackBufferHeight;
m_PresentParameters.VideoScalerParameters.ScaledOutputWidth = videoMode.dwDisplayWidth;
m_PresentParameters.VideoScalerParameters.ScaledOutputHeight = videoMode.dwDisplayHeight;
DevMsg( "VIDEO SCALING: scaling from %dx%d to %dx%d\n", ( int )m_PresentParameters.BackBufferWidth, ( int )m_PresentParameters.BackBufferHeight,
( int )videoMode.dwDisplayWidth, ( int )videoMode.dwDisplayHeight );
}
else
{
DevMsg( "VIDEO SCALING: No scaling: %dx%d\n", ( int )m_PresentParameters.BackBufferWidth, ( int )m_PresentParameters.BackBufferHeight );
}
#endif
}
else // if windowed
{
// NJS: We are seeing a lot of time spent in present in some cases when this isn't set.
m_PresentParameters.PresentationInterval = D3DPRESENT_INTERVAL_IMMEDIATE;
if ( info.m_bResizing )
{
if ( info.m_bLimitWindowedSize &&
( info.m_nWindowedSizeLimitWidth < mode.m_nWidth || info.m_nWindowedSizeLimitHeight < mode.m_nHeight ) )
{
// When using material system in windowed resizing apps, it's
// sometimes not a good idea to allocate stuff as big as the screen
// video cards can soo run out of resources
m_PresentParameters.BackBufferWidth = info.m_nWindowedSizeLimitWidth;
m_PresentParameters.BackBufferHeight = info.m_nWindowedSizeLimitHeight;
}
else
{
// When in resizing windowed mode,
// we want to allocate enough memory to deal with any resizing...
m_PresentParameters.BackBufferWidth = mode.m_nWidth;
m_PresentParameters.BackBufferHeight = mode.m_nHeight;
}
}
else
{
m_PresentParameters.BackBufferWidth = info.m_DisplayMode.m_nWidth;
m_PresentParameters.BackBufferHeight = info.m_DisplayMode.m_nHeight;
}
m_PresentParameters.BackBufferFormat = ImageLoader::ImageFormatToD3DFormat( backBufferFormat );
m_PresentParameters.BackBufferCount = 1; // Windowed, so only double buffer
}
if ( info.m_nAASamples > 0 && ( m_PresentParameters.SwapEffect == D3DSWAPEFFECT_DISCARD ) )
{
D3DMULTISAMPLE_TYPE multiSampleType = ComputeMultisampleType( info.m_nAASamples );
DWORD nQualityLevel;
// FIXME: Should we add the quality level to the ShaderAdapterMode_t struct?
// 16x on nVidia refers to CSAA or "Coverage Sampled Antialiasing"
const HardwareCaps_t &adapterCaps = g_ShaderDeviceMgrDx8.GetHardwareCaps( nAdapter );
if ( ( info.m_nAASamples == 16 ) && ( adapterCaps.m_VendorID == VENDORID_NVIDIA ) )
{
multiSampleType = ComputeMultisampleType(4);
hr = D3D()->CheckDeviceMultiSampleType( nAdapter, DX8_DEVTYPE,
m_PresentParameters.BackBufferFormat, m_PresentParameters.Windowed,
multiSampleType, &nQualityLevel ); // 4x at highest quality level
if ( !FAILED( hr ) && ( nQualityLevel == 16 ) )
{
nQualityLevel = nQualityLevel - 1; // Highest quality level triggers 16x CSAA
}
else
{
nQualityLevel = 0; // No CSAA
}
}
else // Regular MSAA on any old vendor
{
hr = D3D()->CheckDeviceMultiSampleType( nAdapter, DX8_DEVTYPE,
m_PresentParameters.BackBufferFormat, m_PresentParameters.Windowed,
multiSampleType, &nQualityLevel );
nQualityLevel = 0;
}
if ( !FAILED( hr ) )
{
m_PresentParameters.MultiSampleType = multiSampleType;
m_PresentParameters.MultiSampleQuality = nQualityLevel;
}
}
else
{
m_PresentParameters.MultiSampleType = D3DMULTISAMPLE_NONE;
m_PresentParameters.MultiSampleQuality = 0;
}
}
//-----------------------------------------------------------------------------
// Initializes, shuts down the D3D device
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::InitDevice( void* hwnd, int nAdapter, const ShaderDeviceInfo_t &info )
{
//Debugger();
// good place to run some self tests.
//#if OSX
//{
// extern void GLMgrSelfTests( void );
// GLMgrSelfTests();
//}
//#endif
// windowed
if ( !CreateD3DDevice( (VD3DHWND)hwnd, nAdapter, info ) )
return false;
// Hook up our own windows proc to get at messages to tell us when
// other instances of the material system are trying to set the mode
InstallWindowHook( (VD3DHWND)m_hWnd );
return true;
}
void CShaderDeviceDx8::ShutdownDevice()
{
if ( ( IsPC() || IsPS3() ) && IsActive() )
{
Dx9Device()->Release();
#ifdef STUBD3D
delete ( CStubD3DDevice * )Dx9Device();
#endif
#if !defined( _X360 ) && !defined( _PS3 )
Dx9Device()->ShutDownDevice();
#endif
RemoveWindowHook( (VD3DHWND)m_hWnd );
m_hWnd = 0;
}
}
//-----------------------------------------------------------------------------
// Are we using graphics?
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::IsUsingGraphics() const
{
//*****LOCK_SHADERAPI();
return IsActive();
}
//-----------------------------------------------------------------------------
// Returns the current adapter in use
//-----------------------------------------------------------------------------
int CShaderDeviceDx8::GetCurrentAdapter() const
{
LOCK_SHADERAPI();
return m_DisplayAdapter;
}
//-----------------------------------------------------------------------------
// Use this to spew information about the 3D layer
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::SpewDriverInfo() const
{
LOCK_SHADERAPI();
HRESULT hr;
D3DCAPS caps;
D3DADAPTER_IDENTIFIER9 ident;
RECORD_COMMAND( DX8_GET_DEVICE_CAPS, 0 );
RECORD_COMMAND( DX8_GET_ADAPTER_IDENTIFIER, 2 );
RECORD_INT( m_nAdapter );
RECORD_INT( 0 );
Dx9Device()->GetDeviceCaps( &caps );
hr = D3D()->GetAdapterIdentifier( m_nAdapter, D3DENUM_WHQL_LEVEL, &ident );
Warning("Shader API Driver Info:\n\nDriver : %s Version : %lld\n",
ident.Driver, ident.DriverVersion.QuadPart );
Warning("Driver Description : %s\n", ident.Description );
Warning("Chipset version %d %d %d %d\n\n",
ident.VendorId, ident.DeviceId, ident.SubSysId, ident.Revision );
ShaderDisplayMode_t mode;
g_pShaderDeviceMgr->GetCurrentModeInfo( &mode, m_nAdapter );
Warning("Display mode : %d x %d @%dHz (%s)\n",
mode.m_nWidth, mode.m_nHeight, mode.m_nRefreshRateNumerator, ImageLoader::GetName( mode.m_Format ) );
Warning("Vertex Shader Version : %d.%d Pixel Shader Version : %d.%d\n",
(caps.VertexShaderVersion >> 8) & 0xFF, caps.VertexShaderVersion & 0xFF,
(caps.PixelShaderVersion >> 8) & 0xFF, caps.PixelShaderVersion & 0xFF);
Warning("\nDevice Caps :\n");
Warning("CANBLTSYSTONONLOCAL %s CANRENDERAFTERFLIP %s HWRASTERIZATION %s\n",
(caps.DevCaps & D3DDEVCAPS_CANBLTSYSTONONLOCAL) ? " Y " : " N ",
(caps.DevCaps & D3DDEVCAPS_CANRENDERAFTERFLIP) ? " Y " : " N ",
(caps.DevCaps & D3DDEVCAPS_HWRASTERIZATION) ? " Y " : "*N*" );
Warning("HWTRANSFORMANDLIGHT %s NPATCHES %s PUREDEVICE %s\n",
(caps.DevCaps & D3DDEVCAPS_HWTRANSFORMANDLIGHT) ? " Y " : " N ",
(caps.DevCaps & D3DDEVCAPS_NPATCHES) ? " Y " : " N ",
(caps.DevCaps & D3DDEVCAPS_PUREDEVICE) ? " Y " : " N " );
Warning("SEPARATETEXTUREMEMORIES %s TEXTURENONLOCALVIDMEM %s TEXTURESYSTEMMEMORY %s\n",
(caps.DevCaps & D3DDEVCAPS_SEPARATETEXTUREMEMORIES) ? "*Y*" : " N ",
(caps.DevCaps & D3DDEVCAPS_TEXTURENONLOCALVIDMEM) ? " Y " : " N ",
(caps.DevCaps & D3DDEVCAPS_TEXTURESYSTEMMEMORY) ? " Y " : " N " );
Warning("TEXTUREVIDEOMEMORY %s TLVERTEXSYSTEMMEMORY %s TLVERTEXVIDEOMEMORY %s\n",
(caps.DevCaps & D3DDEVCAPS_TEXTUREVIDEOMEMORY) ? " Y " : "*N*",
(caps.DevCaps & D3DDEVCAPS_TLVERTEXSYSTEMMEMORY) ? " Y " : "*N*",
(caps.DevCaps & D3DDEVCAPS_TLVERTEXVIDEOMEMORY) ? " Y " : " N " );
Warning("\nPrimitive Caps :\n");
Warning("BLENDOP %s CLIPPLANESCALEDPOINTS %s CLIPTLVERTS %s\n",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_BLENDOP) ? " Y " : " N ",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_CLIPPLANESCALEDPOINTS) ? " Y " : " N ",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_CLIPTLVERTS) ? " Y " : " N " );
Warning("COLORWRITEENABLE %s MASKZ %s TSSARGTEMP %s\n",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_COLORWRITEENABLE) ? " Y " : " N ",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_MASKZ) ? " Y " : "*N*",
(caps.PrimitiveMiscCaps & D3DPMISCCAPS_TSSARGTEMP) ? " Y " : " N " );
Warning("\nRaster Caps :\n");
Warning("FOGRANGE %s FOGTABLE %s FOGVERTEX %s ZFOG %s WFOG %s\n",
(caps.RasterCaps & D3DPRASTERCAPS_FOGRANGE) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_FOGTABLE) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_FOGVERTEX) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_ZFOG) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_WFOG) ? " Y " : " N " );
Warning("MIPMAPLODBIAS %s WBUFFER %s ZBIAS %s ZTEST %s\n",
(caps.RasterCaps & D3DPRASTERCAPS_MIPMAPLODBIAS) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_WBUFFER) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_DEPTHBIAS) ? " Y " : " N ",
(caps.RasterCaps & D3DPRASTERCAPS_ZTEST) ? " Y " : "*N*" );
Warning("Size of Texture Memory : %d kb\n", g_pHardwareConfig->Caps().m_TextureMemorySize / 1024 );
Warning("Max Texture Dimensions : %d x %d\n",
caps.MaxTextureWidth, caps.MaxTextureHeight );
if (caps.MaxTextureAspectRatio != 0)
Warning("Max Texture Aspect Ratio : *%d*\n", caps.MaxTextureAspectRatio );
Warning("Max Textures : %d\n",
caps.MaxSimultaneousTextures );
Warning("\nTexture Caps :\n");
Warning("ALPHA %s CUBEMAP %s MIPCUBEMAP %s SQUAREONLY %s\n",
(caps.TextureCaps & D3DPTEXTURECAPS_ALPHA) ? " Y " : " N ",
(caps.TextureCaps & D3DPTEXTURECAPS_CUBEMAP) ? " Y " : " N ",
(caps.TextureCaps & D3DPTEXTURECAPS_MIPCUBEMAP) ? " Y " : " N ",
(caps.TextureCaps & D3DPTEXTURECAPS_SQUAREONLY) ? "*Y*" : " N " );
Warning( "vendor id: 0x%x\n", g_pHardwareConfig->ActualCaps().m_VendorID );
Warning( "device id: 0x%x\n", g_pHardwareConfig->ActualCaps().m_DeviceID );
Warning( "SHADERAPI CAPS:\n" );
Warning( "m_NumSamplers: %d\n", g_pHardwareConfig->Caps().m_NumSamplers );
Warning( "m_NumVertexSamplers: %d\n", g_pHardwareConfig->Caps().m_NumVertexSamplers );
Warning( "m_HasSetDeviceGammaRamp: %s\n", g_pHardwareConfig->Caps().m_HasSetDeviceGammaRamp ? "yes" : "no" );
Warning( "m_SupportsPixelShaders_2_b: %s\n", g_pHardwareConfig->Caps().m_SupportsPixelShaders_2_b ? "yes" : "no" );
Warning( "m_SupportsShaderModel_3_0: %s\n", g_pHardwareConfig->Caps().m_SupportsShaderModel_3_0 ? "yes" : "no" );
Warning( "m_SupportsCompressedVertices: %d\n", g_pHardwareConfig->Caps().m_SupportsCompressedVertices );
Warning( "m_bSupportsAnisotropicFiltering: %s\n", g_pHardwareConfig->Caps().m_bSupportsAnisotropicFiltering ? "yes" : "no" );
Warning( "m_nMaxAnisotropy: %d\n", g_pHardwareConfig->Caps().m_nMaxAnisotropy );
Warning( "m_MaxTextureWidth: %d\n", g_pHardwareConfig->Caps().m_MaxTextureWidth );
Warning( "m_MaxTextureHeight: %d\n", g_pHardwareConfig->Caps().m_MaxTextureHeight );
Warning( "m_MaxTextureAspectRatio: %d\n", g_pHardwareConfig->Caps().m_MaxTextureAspectRatio );
Warning( "m_MaxPrimitiveCount: %d\n", g_pHardwareConfig->Caps().m_MaxPrimitiveCount );
Warning( "m_ZBiasAndSlopeScaledDepthBiasSupported: %s\n", g_pHardwareConfig->Caps().m_ZBiasAndSlopeScaledDepthBiasSupported ? "yes" : "no" );
Warning( "m_NumPixelShaderConstants: %d\n", g_pHardwareConfig->Caps().m_NumPixelShaderConstants );
Warning( "m_NumVertexShaderConstants: %d\n", g_pHardwareConfig->Caps().m_NumVertexShaderConstants );
Warning( "m_NumBooleanVertexShaderConstants: %d\n", g_pHardwareConfig->Caps().m_NumBooleanVertexShaderConstants );
Warning( "m_NumIntegerVertexShaderConstants: %d\n", g_pHardwareConfig->Caps().m_NumIntegerVertexShaderConstants );
Warning( "m_TextureMemorySize: %d\n", g_pHardwareConfig->Caps().m_TextureMemorySize );
Warning( "m_MaxNumLights: %d\n", g_pHardwareConfig->Caps().m_MaxNumLights );
Warning( "m_MaxVertexShaderBlendMatrices: %d\n", g_pHardwareConfig->Caps().m_MaxVertexShaderBlendMatrices );
Warning( "m_SupportsMipmappedCubemaps: %s\n", g_pHardwareConfig->Caps().m_SupportsMipmappedCubemaps ? "yes" : "no" );
Warning( "m_nDXSupportLevel: %d\n", g_pHardwareConfig->Caps().m_nDXSupportLevel );
Warning( "m_PreferDynamicTextures: %s\n", g_pHardwareConfig->Caps().m_PreferDynamicTextures ? "yes" : "no" );
Warning( "m_MaxUserClipPlanes: %d\n", g_pHardwareConfig->Caps().m_MaxUserClipPlanes );
Warning( "m_SupportsSRGB: %s\n", g_pHardwareConfig->Caps().m_SupportsSRGB ? "yes" : "no" );
switch( g_pHardwareConfig->Caps().m_HDRType )
{
case HDR_TYPE_NONE:
Warning( "m_HDRType: HDR_TYPE_NONE\n" );
break;
case HDR_TYPE_INTEGER:
Warning( "m_HDRType: HDR_TYPE_INTEGER\n" );
break;
case HDR_TYPE_FLOAT:
Warning( "m_HDRType: HDR_TYPE_FLOAT\n" );
break;
default:
Assert( 0 );
break;
}
Warning( "m_UseFastClipping: %s\n", g_pHardwareConfig->Caps().m_UseFastClipping ? "yes" : "no" );
Warning( "m_pShaderDLL: %s\n", g_pHardwareConfig->Caps().m_pShaderDLL );
Warning( "m_bNeedsATICentroidHack: %s\n", g_pHardwareConfig->Caps().m_bNeedsATICentroidHack ? "yes" : "no" );
Warning( "m_bDisableShaderOptimizations: %s\n", g_pHardwareConfig->Caps().m_bDisableShaderOptimizations ? "yes" : "no" );
Warning( "m_MaxSimultaneousRenderTargets: %d\n", g_pHardwareConfig->Caps().m_MaxSimultaneousRenderTargets );
Warning( "m_bPreferZPrepass: %s\n", g_pHardwareConfig->Caps().m_bPreferZPrepass ? "yes" : "no" );
Warning( "m_bSuppressPixelShaderCentroidHackFixup: %s\n", g_pHardwareConfig->Caps().m_bSuppressPixelShaderCentroidHackFixup ? "yes" : "no" );
Warning( "m_bPreferTexturesInHWMemory: %s\n", g_pHardwareConfig->Caps().m_bPreferTexturesInHWMemory ? "yes" : "no" );
Warning( "m_bPreferHardwareSync: %s\n", g_pHardwareConfig->Caps().m_bPreferHardwareSync ? "yes" : "no" );
Warning( "m_bUnsupported: %s\n", g_pHardwareConfig->Caps().m_bUnsupported ? "yes" : "no" );
}
//-----------------------------------------------------------------------------
// Back buffer information
//-----------------------------------------------------------------------------
ImageFormat CShaderDeviceDx8::GetBackBufferFormat() const
{
return ImageLoader::D3DFormatToImageFormat( m_PresentParameters.BackBufferFormat );
}
void CShaderDeviceDx8::GetBackBufferDimensions( int& width, int& height ) const
{
width = m_PresentParameters.BackBufferWidth;
height = m_PresentParameters.BackBufferHeight;
}
const AspectRatioInfo_t &CShaderDeviceDx8::GetAspectRatioInfo() const
{
Assert( m_AspectRatioInfo.m_bInitialized );
if ( !m_AspectRatioInfo.m_bInitialized )
{
Error( "GetAspectRatioInfo called before aspect ratio is initialized!\n" );
}
return m_AspectRatioInfo;
}
//-----------------------------------------------------------------------------
// Detects support for CreateQuery
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::DetectQuerySupport( IDirect3DDevice9 *pD3DDevice )
{
// Do I need to detect whether this device supports CreateQuery before creating it?
if ( m_DeviceSupportsCreateQuery != -1 )
return;
IDirect3DQuery9 *pQueryObject = NULL;
// Detect whether query is supported by creating and releasing:
HRESULT hr = pD3DDevice->CreateQuery( D3DQUERYTYPE_EVENT, &pQueryObject );
if ( !FAILED(hr) && pQueryObject )
{
pQueryObject->Release();
m_DeviceSupportsCreateQuery = 1;
}
else
{
m_DeviceSupportsCreateQuery = 0;
}
}
#ifdef _X360
void GPUHangCallback( const char *pDescription )
{
if ( !pDescription )
{
#ifdef _CERT
XboxLaunch()->Launch();
#endif
return;
}
#ifndef _CERT
Warning( pDescription );
#endif
}
#endif
#if(DIRECT3D_VERSION < 0x0900)
#define D3DDEVTYPE_NULLREF ( D3DDEVTYPE )4
#endif
//-----------------------------------------------------------------------------
// Actually creates the D3D Device once the present parameters are set up
//-----------------------------------------------------------------------------
IDirect3DDevice9* CShaderDeviceDx8::InvokeCreateDevice( void* hWnd, int nAdapter, DWORD deviceCreationFlags )
{
IDirect3DDevice9 *pD3DDevice = NULL;
D3DDEVTYPE devType = DX8_DEVTYPE;
#if NVPERFHUD
nAdapter = D3D()->GetAdapterCount()-1;
devType = D3DDEVTYPE_REF;
deviceCreationFlags = D3DCREATE_FPU_PRESERVE | D3DCREATE_HARDWARE_VERTEXPROCESSING;
#endif
if ( !IsX360() )
{
// Create the device with multi-threaded safeguards if we're using mat_queue_mode 2.
// The logic to enable multithreaded rendering happens well after the device has been created,
// so we replicate some of that logic here.
ConVarRef mat_queue_mode( "mat_queue_mode" );
if ( mat_queue_mode.GetInt() == 2 ||
( mat_queue_mode.GetInt() == -2 && GetCPUInformation().m_nPhysicalProcessors >= 2 ) ||
( mat_queue_mode.GetInt() == -1 && GetCPUInformation().m_nPhysicalProcessors >= 2 ) )
{
deviceCreationFlags |= D3DCREATE_MULTITHREADED;
}
}
#ifdef ENABLE_NULLREF_DEVICE_SUPPORT
devType = CommandLine()->FindParm( "-nulldevice" ) ? D3DDEVTYPE_NULLREF: devType;
#endif
#if defined ( DX_TO_GL_ABSTRACTION )
gGL = GetOpenGLEntryPoints(0);
#endif
HRESULT hr = D3D()->CreateDevice( nAdapter, devType,
(VD3DHWND)hWnd, deviceCreationFlags, &m_PresentParameters, &pD3DDevice );
if (FAILED(hr) || !pD3DDevice)
{
if ( !IsPC() )
return NULL;
// try again, other applications may be taking their time
Sleep( 1000 );
hr = D3D()->CreateDevice( nAdapter, devType, (VD3DHWND)hWnd, deviceCreationFlags, &m_PresentParameters, &pD3DDevice );
if (FAILED(hr) || !pD3DDevice)
{
// in this case, we actually are allocating too much memory....
// This will cause us to use less buffers...
if ( m_PresentParameters.Windowed )
{
m_PresentParameters.SwapEffect = D3DSWAPEFFECT_COPY;
m_PresentParameters.BackBufferCount = 0;
hr = D3D()->CreateDevice( nAdapter, devType,
(VD3DHWND)hWnd, deviceCreationFlags, &m_PresentParameters, &pD3DDevice );
}
}
}
if ( !FAILED( hr ) && pD3DDevice )
{
g_pShaderDeviceMgr->InvokeDeviceResetNotifications( pD3DDevice, &m_PresentParameters, hWnd );
#ifdef _X360
pD3DDevice->SetHangCallback( GPUHangCallback );
#endif
}
else
{
// Otherwise we failed, show a message and shutdown
pD3DDevice = NULL;
Log_Warning( LOG_EngineInitialization, "Failed to create %s device! Please see the following for more info.\n"
"http://support.steampowered.com/cgi-bin/steampowered.cfg/php/enduser/std_adp.php?p_faqid=772\n", IsOpenGL() ? "OpenGL" : "D3D" );
}
return pD3DDevice;
}
//-----------------------------------------------------------------------------
// Creates the D3D Device
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::CreateD3DDevice( void* pHWnd, int nAdapter, const ShaderDeviceInfo_t &info )
{
Assert( info.m_nVersion == SHADER_DEVICE_INFO_VERSION );
MEM_ALLOC_CREDIT_( __FILE__ ": D3D Device" );
VD3DHWND hWnd = (VD3DHWND)pHWnd;
#if ( !defined( PIX_INSTRUMENTATION ) && !defined( _X360 ) && !defined( NVPERFHUD ) )
D3DPERF_SetOptions(1); // Explicitly disallow PIX instrumented profiling in external builds
#endif
// Get some caps....
D3DCAPS caps;
HRESULT hr = D3D()->GetDeviceCaps( nAdapter, DX8_DEVTYPE, &caps );
if ( FAILED( hr ) )
return false;
// Determine the adapter format
ShaderDisplayMode_t mode;
g_pShaderDeviceMgrDx8->GetCurrentModeInfo( &mode, nAdapter );
m_AdapterFormat = mode.m_Format;
// FIXME: Need to do this prior to SetPresentParameters. Fix.
// Make it part of HardwareCaps_t
InitializeColorInformation( nAdapter, DX8_DEVTYPE, m_AdapterFormat );
Assert( D3DSupportsCompressedTextures() );
const HardwareCaps_t &adapterCaps = g_ShaderDeviceMgrDx8.GetHardwareCaps( nAdapter );
DWORD deviceCreationFlags = ComputeDeviceCreationFlags( caps, adapterCaps.m_bSoftwareVertexProcessing );
SetPresentParameters( hWnd, nAdapter, info );
// Tell all other instances of the material system to let go of memory
SendIPCMessage( RELEASE_MESSAGE );
// Create a stereo texture updater so the nvidia dll's can init. Must be BEFORE device creation!
#if !defined( _GAMECONSOLE ) && !defined(DX_TO_GL_ABSTRACTION) && ( IS_WINDOWS_PC )
nv::stereo::HL2StereoD3D9 *pStereoD3D9 = new nv::stereo::HL2StereoD3D9;
#endif
// Creates the device
IDirect3DDevice9 *pD3DDevice = InvokeCreateDevice( pHWnd, nAdapter, deviceCreationFlags );
if ( !pD3DDevice )
{
#if !defined( _GAMECONSOLE ) && !defined(DX_TO_GL_ABSTRACTION) && ( IS_WINDOWS_PC )
delete pStereoD3D9;
#endif
return false;
}
DetectQuerySupport( pD3DDevice ); // Check to see if query is supported
// This must happen AFTER device creation
#if !defined( _GAMECONSOLE ) && !defined(DX_TO_GL_ABSTRACTION) && ( IS_WINDOWS_PC )
pStereoD3D9->Init( pD3DDevice );
#endif
#ifdef STUBD3D
Dx9Device() = new CStubD3DDevice( pD3DDevice, g_pFullFileSystem );
#elif !defined( _GAMECONSOLE )
Dx9Device()->SetDevicePtr( pD3DDevice, &m_PresentParameters, pHWnd );
#if !defined( _GAMECONSOLE ) && !defined(DX_TO_GL_ABSTRACTION) && ( IS_WINDOWS_PC )
// Give pointer to d3d_async layer (it will free the memory later)
Dx9Device()->SetStereoTextureUpdater( pStereoD3D9 );
#endif
#else
m_pD3DDevice = pD3DDevice;
#endif
#if defined( _X360 )
// Create the depth buffer, created manually to enable hierarchical z
{
D3DSURFACE_PARAMETERS DepthStencilParams;
V_memset( &DepthStencilParams, 0, sizeof( DepthStencilParams ) );
// Depth is immediately after the back buffer in EDRAM
// allocate the hierarchical z tiles at the end of the area so all other allocations can trivially allocate at 0
DepthStencilParams.Base = XGSurfaceSize(
m_PresentParameters.BackBufferWidth,
m_PresentParameters.BackBufferHeight,
m_PresentParameters.BackBufferFormat,
m_PresentParameters.MultiSampleType );
DepthStencilParams.ColorExpBias = 0;
DepthStencilParams.HierarchicalZBase = GPU_HIERARCHICAL_Z_TILES - XGHierarchicalZSize( m_PresentParameters.BackBufferWidth, m_PresentParameters.BackBufferHeight, m_PresentParameters.MultiSampleType );
DepthStencilParams.HiZFunc = D3DHIZFUNC_DEFAULT;
IDirect3DSurface *pDepthStencilSurface = NULL;
hr = Dx9Device()->CreateDepthStencilSurface(
m_PresentParameters.BackBufferWidth,
m_PresentParameters.BackBufferHeight,
m_PresentParameters.AutoDepthStencilFormat,
m_PresentParameters.MultiSampleType,
m_PresentParameters.MultiSampleQuality,
TRUE,
&pDepthStencilSurface,
&DepthStencilParams );
Assert( SUCCEEDED( hr ) );
if ( FAILED( hr ) )
return false;
hr = Dx9Device()->SetDepthStencilSurface( pDepthStencilSurface );
Assert( SUCCEEDED( hr ) );
if ( FAILED( hr ) )
return false;
}
// Initialize XUI, needed for TTF font rasterization
// xui requires and shares our d3d device
{
hr = XuiRenderInitShared( pD3DDevice, &m_PresentParameters, XuiD3DXTextureLoader );
if ( FAILED( hr ) )
return false;
XUIInitParams xuiInit;
XUI_INIT_PARAMS( xuiInit );
xuiInit.dwFlags = XUI_INIT_PARAMS_FLAGS_NONE;
xuiInit.pHooks = NULL;
hr = XuiInit( &xuiInit );
if ( FAILED( hr ) )
return false;
hr = XuiRenderCreateDC( &m_hDC );
if ( FAILED( hr ) )
return false;
}
#endif
// CheckDeviceLost();
// Tell all other instances of the material system it's ok to grab memory
SendIPCMessage( REACQUIRE_MESSAGE );
m_hWnd = pHWnd;
m_nAdapter = m_DisplayAdapter = nAdapter;
m_DeviceState = DEVICE_STATE_OK;
m_bIsMinimized = false;
m_bQueuedDeviceLost = false;
m_IsResizing = info.m_bWindowed && info.m_bResizing;
// This is our current view.
m_ViewHWnd = hWnd;
GetWindowSize( m_nWindowWidth, m_nWindowHeight );
g_pHardwareConfig->SetupHardwareCaps( info, g_ShaderDeviceMgrDx8.GetHardwareCaps( nAdapter ) );
g_pHardwareConfig->CapsForEdit().m_SupportsCompressedTextures = COMPRESSED_TEXTURES_ON;
return ( !FAILED( hr ) );
}
//-----------------------------------------------------------------------------
// Frame sync
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::AllocFrameSyncTextureObject()
{
if ( IsGameConsole() || IsOSX() )
return;
FreeFrameSyncTextureObject();
// Create a tiny managed texture.
HRESULT hr = Dx9Device()->CreateTexture(
1, 1, // width, height
0, // levels
D3DUSAGE_DYNAMIC, // usage
D3DFMT_A8R8G8B8, // format
D3DPOOL_DEFAULT,
&m_pFrameSyncTexture,
NULL );
if ( FAILED( hr ) )
{
m_pFrameSyncTexture = NULL;
}
}
void CShaderDeviceDx8::FreeFrameSyncTextureObject()
{
if ( IsGameConsole() || IsOSX() )
return;
if ( m_pFrameSyncTexture )
{
m_pFrameSyncTexture->Release();
m_pFrameSyncTexture = NULL;
}
}
void CShaderDeviceDx8::AllocFrameSyncObjects( void )
{
if ( IsGameConsole() || IsOSX() )
return;
if ( mat_debugalttab.GetBool() )
{
Warning( "mat_debugalttab: CShaderAPIDX8::AllocFrameSyncObjects\n" );
}
// Allocate the texture for frame syncing in case we force that to be on.
AllocFrameSyncTextureObject();
if ( m_DeviceSupportsCreateQuery == 0 )
{
for ( int i = 0; i < ARRAYSIZE(m_pFrameSyncQueryObject); i++ )
{
m_pFrameSyncQueryObject[i] = NULL;
m_bQueryIssued[i] = false;
}
return;
}
// FIXME FIXME FIXME!!!!! Need to record this.
for ( int i = 0; i < ARRAYSIZE(m_pFrameSyncQueryObject); i++ )
{
HRESULT hr = Dx9Device()->CreateQuery( D3DQUERYTYPE_EVENT, &m_pFrameSyncQueryObject[i] );
if( hr == D3DERR_NOTAVAILABLE )
{
Warning( "D3DQUERYTYPE_EVENT not available on this driver\n" );
Assert( m_pFrameSyncQueryObject[i] == NULL );
}
else
{
Assert( hr == D3D_OK );
Assert( m_pFrameSyncQueryObject[i] );
m_pFrameSyncQueryObject[i]->Issue( D3DISSUE_END );
m_bQueryIssued[i] = true;
}
}
}
void CShaderDeviceDx8::FreeFrameSyncObjects( void )
{
if ( IsX360() || IsOSX() )
return;
if ( mat_debugalttab.GetBool() )
{
Warning( "mat_debugalttab: CShaderAPIDX8::FreeFrameSyncObjects\n" );
}
FreeFrameSyncTextureObject();
// FIXME FIXME FIXME!!!!! Need to record this.
for ( int i = 0; i < ARRAYSIZE(m_pFrameSyncQueryObject); i++ )
{
if ( m_pFrameSyncQueryObject[i] )
{
if ( m_bQueryIssued[i] )
{
double flStartTime = Plat_FloatTime();
BOOL dummyData = 0;
HRESULT hr = S_OK;
// Make every attempt (within 2 seconds) to get the result from the query. Doing so may prevent
// crashes in the driver if we try to release outstanding queries.
do
{
hr = m_pFrameSyncQueryObject[i]->GetData( &dummyData, sizeof( dummyData ), D3DGETDATA_FLUSH );
double flCurrTime = Plat_FloatTime();
// don't wait more than 2 seconds for these
if ( flCurrTime - flStartTime > 2.00 )
break;
} while ( hr == S_FALSE );
}
#ifdef DBGFLAG_ASSERT
int nRetVal =
#endif
m_pFrameSyncQueryObject[i]->Release();
Assert( nRetVal == 0 );
m_pFrameSyncQueryObject[i] = NULL;
m_bQueryIssued[i] = false;
}
}
}
//-----------------------------------------------------------------------------
// Occurs when another application is initializing
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::OtherAppInitializing( bool initializing )
{
if ( !ThreadOwnsDevice() || !ThreadInMainThread() )
{
if ( initializing )
{
ShaderUtil()->OnThreadEvent( SHADER_THREAD_OTHER_APP_START );
}
else
{
ShaderUtil()->OnThreadEvent( SHADER_THREAD_OTHER_APP_END );
}
return;
}
Assert( m_bOtherAppInitializing != initializing );
if ( !IsDeactivated() )
{
Dx9Device()->EndScene();
}
// NOTE: OtherApp is set in this way because we need to know we're
// active as we release and restore everything
CheckDeviceLost( initializing );
if ( !IsDeactivated() )
{
Dx9Device()->BeginScene();
}
}
void CShaderDeviceDx8::HandleThreadEvent( uint32 threadEvent )
{
Assert(ThreadOwnsDevice());
switch ( threadEvent )
{
case SHADER_THREAD_OTHER_APP_START:
OtherAppInitializing(true);
break;
case SHADER_THREAD_RELEASE_RESOURCES:
ReleaseResources();
break;
case SHADER_THREAD_EVICT_RESOURCES:
EvictManagedResourcesInternal();
break;
case SHADER_THREAD_RESET_RENDER_STATE:
ResetRenderState();
break;
case SHADER_THREAD_ACQUIRE_RESOURCES:
ReacquireResources();
break;
case SHADER_THREAD_OTHER_APP_END:
OtherAppInitializing(false);
break;
}
}
//-----------------------------------------------------------------------------
// We lost the device, but we have a chance to recover
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::TryDeviceReset()
{
if ( IsX360() )
return true;
// Don't try to reset the device until we're sure our resources have been released
if ( !m_bResourcesReleased )
{
return false;
}
// FIXME: Make this rebuild the Dx9Device from scratch!
// Helps with compatibility
HRESULT hr = Dx9Device()->Reset( &m_PresentParameters );
bool bResetSuccess = !FAILED(hr);
if ( bResetSuccess )
{
m_bResourcesReleased = false;
#if !defined( _GAMECONSOLE )
Dx9Device()->ReportDeviceReset();
#endif
}
return bResetSuccess;
}
//-----------------------------------------------------------------------------
// Release, reacquire resources
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::ReleaseResources( bool bReleaseManagedResources /*= true*/ )
{
if ( !ThreadOwnsDevice() || !ThreadInMainThread() )
{
// We shouldn't be asked to release resources but keep mananged resources around unless
// this thread owns the device.
Assert( bReleaseManagedResources == true );
// Set our resources as not being released yet.
// We reset this in two places since release resources can be called without a call to TryDeviceReset.
m_bResourcesReleased = false;
ShaderUtil()->OnThreadEvent( SHADER_THREAD_RELEASE_RESOURCES );
return;
}
// Only the initial "ReleaseResources" actually has effect
if ( m_numReleaseResourcesRefCount ++ != 0 )
{
Warning( "ReleaseResources has no effect, now at level %d.\n", m_numReleaseResourcesRefCount );
DevWarning( "ReleaseResources called twice is a bug: use IsDeactivated to check for a valid device.\n" );
Assert( 0 );
return;
}
LOCK_SHADERAPI();
CPixEvent( PIX_VALVE_ORANGE, "ReleaseResources" );
FreeFrameSyncObjects();
FreeNonInteractiveRefreshObjects();
int nRestoreFlags = bReleaseManagedResources ? MATERIAL_RESTORE_RELEASE_MANAGED_RESOURCES : 0;
ShaderUtil()->ReleaseShaderObjects( nRestoreFlags );
MeshMgr()->ReleaseBuffers();
g_pShaderAPI->ReleaseShaderObjects( bReleaseManagedResources );
#ifdef _DEBUG
if ( MeshMgr()->BufferCount() != 0 )
{
for( int i = 0; i < MeshMgr()->BufferCount(); i++ )
{
}
}
#endif
// All meshes cleaned up?
Assert( MeshMgr()->BufferCount() == 0 );
// Signal that our resources have been released so that we can try to reset the device
m_bResourcesReleased = true;
}
void CShaderDeviceDx8::ReacquireResources()
{
ReacquireResourcesInternal();
}
void CShaderDeviceDx8::ReacquireResourcesInternal( bool bResetState, bool bForceReacquire, char const *pszForceReason )
{
if ( !ThreadOwnsDevice() || !ThreadInMainThread() )
{
if ( bResetState )
{
ShaderUtil()->OnThreadEvent( SHADER_THREAD_RESET_RENDER_STATE );
}
ShaderUtil()->OnThreadEvent( SHADER_THREAD_ACQUIRE_RESOURCES );
return;
}
if ( bForceReacquire )
{
// If we are forcing reacquire then warn if release calls are remaining unpaired
if ( m_numReleaseResourcesRefCount > 1 )
{
Warning( "Forcefully resetting device (%s), resources release level was %d.\n", pszForceReason ? pszForceReason : "unspecified", m_numReleaseResourcesRefCount );
Assert( 0 );
}
m_numReleaseResourcesRefCount = 0;
}
else
{
// Only the final "ReacquireResources" actually has effect
if ( -- m_numReleaseResourcesRefCount != 0 )
{
Warning( "ReacquireResources has no effect, now at level %d.\n", m_numReleaseResourcesRefCount );
DevWarning( "ReacquireResources being discarded is a bug: use IsDeactivated to check for a valid device.\n" );
Assert( 0 );
if ( m_numReleaseResourcesRefCount < 0 )
{
m_numReleaseResourcesRefCount = 0;
}
return;
}
}
if ( bResetState )
{
ResetRenderState();
}
LOCK_SHADERAPI();
CPixEvent event( PIX_VALVE_ORANGE, "ReacquireResources" );
#ifdef VPROF_ENABLED
VPROF_INCREMENT_GROUP_COUNTER( "reacquire_resources", COUNTER_GROUP_NO_RESET, 1 );
#endif
g_pShaderAPI->RestoreShaderObjects();
AllocFrameSyncObjects();
AllocNonInteractiveRefreshObjects();
MeshMgr()->RestoreBuffers();
ShaderUtil()->RestoreShaderObjects( CShaderDeviceMgrBase::ShaderInterfaceFactory );
}
//-----------------------------------------------------------------------------
// Changes the window size
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::ResizeWindow( const ShaderDeviceInfo_t &info )
{
if ( IsGameConsole() )
return false;
m_bPendingVideoModeChange = false;
// We don't need to do crap if the window was set up to set up
// to be resizing...
if ( info.m_bResizing )
return false;
// needs to run prior to mode change cllbacks that has dependencies on this info
// this is not the "real" set, but an earlier call to just update the dependencies
SetPresentParameters( (HWND)m_hWnd, m_DisplayAdapter, info, true );
g_pShaderDeviceMgr->InvokeModeChangeCallbacks( info.m_DisplayMode.m_nWidth, info.m_DisplayMode.m_nHeight );
SetPresentParameters( (VD3DHWND)m_hWnd, m_DisplayAdapter, info );
g_pShaderDeviceMgr->InvokeDeviceLostNotifications();
// We were ok, now we're not. Release resources
ReleaseResources( ( g_pShaderUtil->GetThreadMode() != MATERIAL_QUEUED_THREADED ) );
m_DeviceState = DEVICE_STATE_NEEDS_RESET;
return true;
}
//-----------------------------------------------------------------------------
// Queue up the fact that the device was lost
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::MarkDeviceLost( )
{
if ( IsX360() )
return;
m_bQueuedDeviceLost = true;
}
//-----------------------------------------------------------------------------
// Checks if the device was lost
//-----------------------------------------------------------------------------
#if defined( _DEBUG ) && !defined( _X360 )
ConVar mat_forcelostdevice( "mat_forcelostdevice", "0" );
#endif
void CShaderDeviceDx8::CheckDeviceLost( bool bOtherAppInitializing )
{
#if !defined( _X360 )
// FIXME: We could also queue up if WM_SIZE changes and look at that
// but that seems to only make sense if we have resizable windows where
// we do *not* allocate buffers as large as the entire current video mode
// which we're not doing
#ifdef _WIN32
m_bIsMinimized = ( static_cast<BOOL>(IsIconic( ( HWND )m_hWnd )) == (BOOL)TRUE );
#else
m_bIsMinimized = ( IsIconic( (VD3DHWND)m_hWnd ) == TRUE );
#endif
m_bOtherAppInitializing = bOtherAppInitializing;
RECORD_COMMAND( DX8_TEST_COOPERATIVE_LEVEL, 0 );
HRESULT hr = Dx9Device()->TestCooperativeLevel();
#ifdef _DEBUG
if ( mat_forcelostdevice.GetBool() )
{
mat_forcelostdevice.SetValue( 0 );
MarkDeviceLost();
}
#endif
// If some other call returned device lost previously in the frame, spoof the return value from TCL
if ( m_bQueuedDeviceLost )
{
hr = (hr != D3D_OK) ? hr : D3DERR_DEVICENOTRESET;
m_bQueuedDeviceLost = false;
}
if ( m_DeviceState == DEVICE_STATE_OK )
{
// Release managed resources if we're anything but in MATERIAL_QUEUED_THREADED. MATERIAL_QUEUED_THREADED is a proxy for whether
// we're actually running the game or in the middle of some loading or concommand that might load gpu resources. This isn't the best
// approach. What we really want is whether we're done loading managed resources or not. However, it's not entirely clear that
// we can bracket that. The upside of using the threadmode is that we are pretty much guaranteed that we don't be in the middle of
// loading. The downside is that on single core PCs, we'll always use the old and slow bReleaseManagedResources == true path that we
// had in l4d1 and previous titles.
bool bReleaseManagedResources = ( g_pShaderUtil->GetThreadMode() != MATERIAL_QUEUED_THREADED );
// We can transition out of ok if bOtherAppInitializing is set
// or if we become minimized, or if TCL returns anything other than D3D_OK.
if ( ( hr != D3D_OK ) || m_bIsMinimized )
{
// purge unreferenced materials
g_pShaderUtil->UncacheUnusedMaterials( true );
g_pShaderDeviceMgr->InvokeDeviceLostNotifications();
// We were ok, now we're not. Release resources
ReleaseResources( bReleaseManagedResources );
m_DeviceState = DEVICE_STATE_LOST_DEVICE;
}
else if ( bOtherAppInitializing )
{
// purge unreferenced materials
g_pShaderUtil->UncacheUnusedMaterials( true );
g_pShaderDeviceMgr->InvokeDeviceLostNotifications();
// We were ok, now we're not. Release resources
ReleaseResources( bReleaseManagedResources );
m_DeviceState = DEVICE_STATE_OTHER_APP_INIT;
}
}
// Immediately checking devicelost after ok helps in the case where we got D3DERR_DEVICENOTRESET
// in which case we want to immdiately try to switch out of DEVICE_STATE_LOST and into DEVICE_STATE_NEEDS_RESET
if ( m_DeviceState == DEVICE_STATE_LOST_DEVICE )
{
// We can only try to reset if we're not minimized and not lost
if ( !m_bIsMinimized && (hr != D3DERR_DEVICELOST) )
{
m_DeviceState = DEVICE_STATE_NEEDS_RESET;
}
}
// Immediately checking needs reset also helps for the case where we got D3DERR_DEVICENOTRESET
if ( m_DeviceState == DEVICE_STATE_NEEDS_RESET )
{
if ( ( hr == D3DERR_DEVICELOST ) || m_bIsMinimized )
{
m_DeviceState = DEVICE_STATE_LOST_DEVICE;
}
else
{
bool bResetSucceeded = TryDeviceReset();
if ( bResetSucceeded )
{
if ( !bOtherAppInitializing )
{
m_DeviceState = DEVICE_STATE_OK;
// purge unreferenced materials
g_pShaderUtil->UncacheUnusedMaterials( true );
// We were bad, now we're ok. Restore resources and reset render state.
ReacquireResourcesInternal( true, true, "NeedsReset" );
}
else
{
m_DeviceState = DEVICE_STATE_OTHER_APP_INIT;
}
}
}
}
if ( m_DeviceState == DEVICE_STATE_OTHER_APP_INIT )
{
if ( ( hr != D3D_OK ) || m_bIsMinimized )
{
m_DeviceState = DEVICE_STATE_LOST_DEVICE;
}
else if ( !bOtherAppInitializing )
{
m_DeviceState = DEVICE_STATE_OK;
// purge unreferenced materials
g_pShaderUtil->UncacheUnusedMaterials( true );
#if !defined( _GAMECONSOLE )
Dx9Device()->ReportDeviceReset();
#else
g_pShaderDeviceMgr->InvokeDeviceResetNotifications( m_pD3DDevice, &m_PresentParameters, m_hWnd );
#endif
// We were bad, now we're ok. Restore resources and reset render state.
ReacquireResourcesInternal( true, true, "OtherAppInit" );
}
}
// Do mode change if we have a video mode change.
if ( m_bPendingVideoModeChange && !IsDeactivated() )
{
#ifdef _DEBUG
Warning( "mode change!\n" );
#endif
ResizeWindow( m_PendingVideoModeChangeConfig );
}
#endif
}
bool CShaderDeviceDx8::BuildStaticShader( bool bVertexShader, void **ppShader, const char *pShaderName,
const char *strShaderProgram, const DWORD *shaderData, unsigned int shaderSize )
{
#if defined( X360_LINK_WITH_SHADER_COMPILE )
// Compile our shader from HLSL-in-a-string
ID3DXBuffer *pErrorMsg = NULL;
ID3DXBuffer *pShaderCode = NULL;
const char *shaderModel = bVertexShader ? "vs_2_0" : "ps_2_0";
HRESULT hr = D3DXCompileShader( strShaderProgram, (UINT)strlen( strShaderProgram ), NULL, NULL, "main", shaderModel, 0, &pShaderCode, &pErrorMsg, NULL );
if ( FAILED( hr ) )
return false;
// Check that our static shader data is valid
if ( ( shaderSize != pShaderCode->GetBufferSize() ) || memcmp( shaderData, pShaderCode->GetBufferPointer(), shaderSize ) )
{
// Use the fallback compiled-from-string data
shaderData = (DWORD*)pShaderCode->GetBufferPointer();
shaderSize = pShaderCode->GetBufferSize();
#if defined( _CERT )
#error "X360_LINK_WITH_SHADER_COMPILE should not be defined when _CERT is defined!! Only use it when revving XDK."
#endif
// Force a crash, so the user will attach a debugger and thus see the below spew
char *p = 0;
*p = 0;
// Shader data needs updating - allow me to spew it out for your cut'n'paste convenience
Plat_DebugString( "\n\nERROR: static shader data in RestorePersistedDisplay needs updating for new XDK/compiler version! (" );
Plat_DebugString( pShaderName );
Plat_DebugString( ")\nconst DWORD shaderData[] = {\n " );
int numLines = ( shaderSize + 31 ) / 32;
for ( int i = 0; i < numLines; i++ )
{
int numWords = MIN( 8, ( ( shaderSize / 4 ) - i*8 ) );
for ( int j = 0; j < numWords; j++ )
{
char wordBuffer[ 32 ];
V_snprintf( wordBuffer, sizeof( wordBuffer ), "0x%08x, ", shaderData[ i*8 + j ] );
Plat_DebugString( wordBuffer );
}
Plat_DebugString( "\n " );
}
Plat_DebugString( "};\n\n" );
}
#endif // defined( X360_LINK_WITH_SHADER_COMPILE )
if ( bVertexShader )
{
#ifdef _GAMECONSOLE
Dx9Device()->CreateVertexShader( shaderData, (IDirect3DVertexShader9 **)ppShader );
#else
Dx9Device()->CreateVertexShader( shaderData, (IDirect3DVertexShader9 **)ppShader, pShaderName );
#endif
}
else
{
#ifdef _GAMECONSOLE
Dx9Device()->CreatePixelShader( shaderData, (IDirect3DPixelShader9 **)ppShader );
#else
Dx9Device()->CreatePixelShader( shaderData, (IDirect3DPixelShader9 **)ppShader, pShaderName );
#endif
}
#if defined( X360_LINK_WITH_SHADER_COMPILE )
pShaderCode->Release();
pShaderCode = NULL;
if ( pErrorMsg )
{
pErrorMsg->Release();
pErrorMsg = NULL;
}
#endif // defined( X360_LINK_WITH_SHADER_COMPILE )
return true;
}
//-----------------------------------------------------------------------------
// Special method to refresh the screen on the XBox360
//-----------------------------------------------------------------------------
bool CShaderDeviceDx8::AllocNonInteractiveRefreshObjects()
{
#if defined( _GAMECONSOLE )
#if defined( _X360 )
// HLSL source for the refresh shaders:
const char *strVertexShaderProgram =
" float4x4 matWVP : register(c0);"
" struct VS_IN"
" {"
" float4 ObjPos : POSITION;"
" float2 TexCoord : TEXCOORD;"
" };"
" struct VS_OUT"
" {"
" float4 ProjPos : POSITION;"
" float2 TexCoord : TEXCOORD;"
" };"
" VS_OUT main( VS_IN In )"
" {"
" VS_OUT Out; "
" Out.ProjPos = mul( matWVP, In.ObjPos );"
" Out.TexCoord = In.TexCoord;"
" return Out;"
" }";
const char *strPixelShaderProgram =
" struct PS_IN"
" {"
" float2 TexCoord : TEXCOORD;"
" };"
" sampler detail : register( s0 );"
" float4 main( PS_IN In ) : COLOR"
" {"
" return tex2D( detail, In.TexCoord );"
" }";
const char *strPixelShaderProgram2 =
" struct PS_IN"
" {"
" float2 TexCoord : TEXCOORD;"
" };"
" sampler detail : register( s0 );"
" float4 main( PS_IN In ) : COLOR"
" {"
" return tex2D( detail, In.TexCoord );"
" }";
const char *strPixelShaderProgram3 =
" struct PS_IN"
" {"
" float2 TexCoord : TEXCOORD;"
" };"
" float SrgbGammaToLinear( float flSrgbGammaValue )"
" {"
" float x = saturate( flSrgbGammaValue );"
" return ( x <= 0.04045f ) ? ( x / 12.92f ) : ( pow( ( x + 0.055f ) / 1.055f, 2.4f ) );"
" }"
" float X360LinearToGamma( float flLinearValue )"
" {"
" float fl360GammaValue;"
" flLinearValue = saturate( flLinearValue );"
" if ( flLinearValue < ( 128.0f / 1023.0f ) )"
" {"
" if ( flLinearValue < ( 64.0f / 1023.0f ) )"
" {"
" fl360GammaValue = flLinearValue * ( 1023.0f * ( 1.0f / 255.0f ) );"
" }"
" else"
" {"
" fl360GammaValue = flLinearValue * ( ( 1023.0f / 2.0f ) * ( 1.0f / 255.0f ) ) + ( 32.0f / 255.0f );"
" }"
" }"
" else"
" {"
" if ( flLinearValue < ( 512.0f / 1023.0f ) )"
" {"
" fl360GammaValue = flLinearValue * ( ( 1023.0f / 4.0f ) * ( 1.0f / 255.0f ) ) + ( 64.0f / 255.0f );"
" }"
" else"
" {"
" fl360GammaValue = flLinearValue * ( ( 1023.0f /8.0f ) * ( 1.0f / 255.0f ) ) + ( 128.0f /255.0f );"
" if ( fl360GammaValue > 1.0f )"
" {"
" fl360GammaValue = 1.0f;"
" }"
" }"
" }"
" fl360GammaValue = saturate( fl360GammaValue );"
" return fl360GammaValue;"
" }"
" sampler detail : register( s0 );"
" float4 main( PS_IN In ) : COLOR"
" {"
" float4 vTextureColor = tex2D( detail, In.TexCoord );"
// Only needed in TOB, not needed for L4D which had a corrected offline PWL processing
// " vTextureColor.r = X360LinearToGamma( SrgbGammaToLinear( vTextureColor.r ) );"
// " vTextureColor.g = X360LinearToGamma( SrgbGammaToLinear( vTextureColor.g ) );"
// " vTextureColor.b = X360LinearToGamma( SrgbGammaToLinear( vTextureColor.b ) );"
" return vTextureColor;"
" }";
// Hard-coded compiled shader data, so we don't have to bloat our DLLs
// with all the shader compilation stuff from the D3D libs (over 2 MB!)
#if defined( _X360 ) && ( _XDK_VER != 20764 )
// Make sure this hard-coded shader data gets updated with each XDK rev
#if !defined( JUNE_2009_XDK_ISSUES )
#error "Define X360_LINK_WITH_SHADER_COMPILE temporarily (to verify compiled static shader data, and spew out new data if necessary)"
#endif
#endif
DWORD vertexShaderData[] = {
0x102a1101, 0x000000bc, 0x00000084, 0x00000000, 0x00000024, 0x00000000, 0x00000084, 0x00000000,
0x00000000, 0x0000005c, 0x0000001c, 0x0000004f, 0xfffe0300, 0x00000001, 0x0000001c, 0x00000000,
0x00000048, 0x00000030, 0x00020000, 0x00040000, 0x00000038, 0x00000000, 0x6d617457, 0x565000ab,
0x00030003, 0x00040004, 0x00010000, 0x00000000, 0x76735f33, 0x5f300032, 0x2e302e32, 0x30373634,
0x2e3000ab, 0x00000000, 0x00000084, 0x00010002, 0x00000000, 0x00000000, 0x00000821, 0x00000001,
0x00000002, 0x00000001, 0x00000290, 0x00100003, 0x00305004, 0x00003050, 0x00001009, 0x30052003,
0x00001200, 0xc2000000, 0x00004005, 0x00001200, 0xc4000000, 0x00001009, 0x00002200, 0x00000000,
0x05f82000, 0x00000688, 0x00000000, 0x05f80000, 0x00000fc8, 0x00000000, 0xc80f0001, 0x001b8800,
0xa1020300, 0xc80f0001, 0x00c68800, 0xab020201, 0xc80f0001, 0x00b13494, 0xab020101, 0xc80f803e,
0x006c0034, 0xab020001, 0xc8038000, 0x00b0b000, 0xe2000000, 0x00000000, 0x00000000, 0x00000000,
};
DWORD pixelShaderData1[] = {
0x102a1100, 0x000000a8, 0x0000003c, 0x00000000, 0x00000024, 0x00000000, 0x00000084, 0x00000000,
0x00000000, 0x0000005c, 0x0000001c, 0x0000004f, 0xffff0300, 0x00000001, 0x0000001c, 0x00000000,
0x00000048, 0x00000030, 0x00030000, 0x00010000, 0x00000038, 0x00000000, 0x64657461, 0x696c00ab,
0x0004000c, 0x00010001, 0x00010000, 0x00000000, 0x70735f33, 0x5f300032, 0x2e302e32, 0x30373634,
0x2e3000ab, 0x00000000, 0x0000003c, 0x10000000, 0x00000004, 0x00000000, 0x00000821, 0x00010001,
0x00000001, 0x00003050, 0x00011002, 0x00001200, 0xc4000000, 0x00001003, 0x00002200, 0x00000000,
0x10080001, 0x1f1ff688, 0x00004000, 0xc80f8000, 0x00000000, 0xe2000000, 0x00000000, 0x00000000,
0x00000000,
};
DWORD pixelShaderData2[] = {
0x102a1100, 0x000000a8, 0x0000003c, 0x00000000, 0x00000024, 0x00000000, 0x00000084, 0x00000000,
0x00000000, 0x0000005c, 0x0000001c, 0x0000004f, 0xffff0300, 0x00000001, 0x0000001c, 0x00000000,
0x00000048, 0x00000030, 0x00030000, 0x00010000, 0x00000038, 0x00000000, 0x64657461, 0x696c00ab,
0x0004000c, 0x00010001, 0x00010000, 0x00000000, 0x70735f33, 0x5f300032, 0x2e302e32, 0x30373634,
0x2e3000ab, 0x00000000, 0x0000003c, 0x10000000, 0x00000004, 0x00000000, 0x00000821, 0x00010001,
0x00000001, 0x00003050, 0x00011002, 0x00001200, 0xc4000000, 0x00001003, 0x00002200, 0x00000000,
0x10080001, 0x1f1ff688, 0x00004000, 0xc80f8000, 0x00000000, 0xe2000000, 0x00000000, 0x00000000,
0x00000000,
};
DWORD pixelShaderData3[] = {
0x102a1100, 0x000000a8, 0x0000003c, 0x00000000, 0x00000024, 0x00000000, 0x00000084, 0x00000000,
0x00000000, 0x0000005c, 0x0000001c, 0x0000004f, 0xffff0300, 0x00000001, 0x0000001c, 0x00000000,
0x00000048, 0x00000030, 0x00030000, 0x00010000, 0x00000038, 0x00000000, 0x64657461, 0x696c00ab,
0x0004000c, 0x00010001, 0x00010000, 0x00000000, 0x70735f33, 0x5f300032, 0x2e302e32, 0x30373634,
0x2e3000ab, 0x00000000, 0x0000003c, 0x10000000, 0x00000004, 0x00000000, 0x00000821, 0x00010001,
0x00000001, 0x00003050, 0x00011002, 0x00001200, 0xc4000000, 0x00001003, 0x00002200, 0x00000000,
0x10080001, 0x1f1ff688, 0x00004000, 0xc80f8000, 0x00000000, 0xe2000000, 0x00000000, 0x00000000,
0x00000000,
};
// Build the requisite shaders:
if ( !BuildStaticShader( true, (void **)&m_NonInteractiveRefresh.m_pVertexShader, "m_pVertexShader",
strVertexShaderProgram, vertexShaderData, sizeof( vertexShaderData ) ) )
return false;
if ( !BuildStaticShader( false, (void **)&m_NonInteractiveRefresh.m_pPixelShader, "m_pPixelShader",
strPixelShaderProgram, pixelShaderData1, sizeof( pixelShaderData1 ) ) )
return false;
if ( !BuildStaticShader( false, (void **)&m_NonInteractiveRefresh.m_pPixelShaderStartup, "m_pPixelShaderStartup",
strPixelShaderProgram2, pixelShaderData2, sizeof( pixelShaderData2 ) ) )
return false;
if ( !BuildStaticShader( false, (void **)&m_NonInteractiveRefresh.m_pPixelShaderStartupPass2, "m_pPixelShaderStartupPass2",
strPixelShaderProgram3, pixelShaderData3, sizeof( pixelShaderData3 ) ) )
return false;
#elif defined( _PS3 )
extern uint32_t _binary_noninteractiveshader_vpo_start;
extern uint32_t _binary_noninteractiveshader_vpo_end;
extern uint32_t _binary_noninteractiveshader_fpo_start;
extern uint32_t _binary_noninteractiveshader_fpo_end;
extern uint32_t _binary_noninteractiveshaderstartup_fpo_start;
extern uint32_t _binary_noninteractiveshaderstartup_fpo_end;
extern uint32_t _binary_noninteractiveshaderstartuppass2_fpo_start;
extern uint32_t _binary_noninteractiveshaderstartuppass2_fpo_end;
Dx9Device()->CreateVertexShader( ( const DWORD* )&_binary_noninteractiveshader_vpo_start, &m_NonInteractiveRefresh.m_pVertexShader, "m_pVertexShader" );
Dx9Device()->CreatePixelShader( ( const DWORD* )&_binary_noninteractiveshader_fpo_start, &m_NonInteractiveRefresh.m_pPixelShader, "m_pPixelShader" );
Dx9Device()->CreatePixelShader( ( const DWORD* )&_binary_noninteractiveshaderstartup_fpo_start, &m_NonInteractiveRefresh.m_pPixelShaderStartup, "m_pPixelShaderStartup" );
Dx9Device()->CreatePixelShader( ( const DWORD* )&_binary_noninteractiveshaderstartuppass2_fpo_start, &m_NonInteractiveRefresh.m_pPixelShaderStartupPass2, "m_pPixelShaderStartupPass2" );
#endif
D3DVERTEXELEMENT9 VertexElements[4] =
{
{ 0, 0, D3DDECLTYPE_FLOAT3, D3DDECLMETHOD_DEFAULT, D3DDECLUSAGE_POSITION, 0 },
{ 0, 12, D3DDECLTYPE_FLOAT2, D3DDECLMETHOD_DEFAULT, D3DDECLUSAGE_TEXCOORD, 0 },
D3DDECL_END()
};
// Create a vertex declaration from the element descriptions.
Dx9Device()->CreateVertexDeclaration( VertexElements, &m_NonInteractiveRefresh.m_pVertexDecl );
#endif
return true;
}
void CShaderDeviceDx8::FreeNonInteractiveRefreshObjects()
{
if ( m_NonInteractiveRefresh.m_pVertexShader )
{
m_NonInteractiveRefresh.m_pVertexShader->Release();
m_NonInteractiveRefresh.m_pVertexShader = NULL;
}
if ( m_NonInteractiveRefresh.m_pPixelShader )
{
m_NonInteractiveRefresh.m_pPixelShader->Release();
m_NonInteractiveRefresh.m_pPixelShader = NULL;
}
if ( m_NonInteractiveRefresh.m_pPixelShaderStartup )
{
m_NonInteractiveRefresh.m_pPixelShaderStartup->Release();
m_NonInteractiveRefresh.m_pPixelShaderStartup = NULL;
}
if ( m_NonInteractiveRefresh.m_pPixelShaderStartupPass2 )
{
m_NonInteractiveRefresh.m_pPixelShaderStartupPass2->Release();
m_NonInteractiveRefresh.m_pPixelShaderStartupPass2 = NULL;
}
if ( m_NonInteractiveRefresh.m_pVertexDecl )
{
m_NonInteractiveRefresh.m_pVertexDecl->Release();
m_NonInteractiveRefresh.m_pVertexDecl = NULL;
}
}
bool CShaderDeviceDx8::InNonInteractiveMode() const
{
return m_NonInteractiveRefresh.m_Mode != MATERIAL_NON_INTERACTIVE_MODE_NONE;
}
void CShaderDeviceDx8::EnableNonInteractiveMode( MaterialNonInteractiveMode_t mode, ShaderNonInteractiveInfo_t *pInfo )
{
if ( !IsGameConsole() )
return;
if ( pInfo && ( pInfo->m_hTempFullscreenTexture == INVALID_SHADERAPI_TEXTURE_HANDLE ) )
{
mode = MATERIAL_NON_INTERACTIVE_MODE_NONE;
}
if ( ( mode == MATERIAL_NON_INTERACTIVE_MODE_STARTUP ) && ( !pInfo || ( pInfo->m_nPacifierCount <= 0 ) ) )
{
Warning( "Badness! Non interactive startup mode wasn't given a pacifier texture!\n" );
}
m_NonInteractiveRefresh.m_Mode = mode;
if ( pInfo )
{
m_NonInteractiveRefresh.m_Info = *pInfo;
}
m_NonInteractiveRefresh.m_nPacifierFrame = 0;
if ( mode != MATERIAL_NON_INTERACTIVE_MODE_NONE )
{
ConVarRef mat_monitorgamma( "mat_monitorgamma" );
ConVarRef mat_monitorgamma_tv_range_min( "mat_monitorgamma_tv_range_min" );
ConVarRef mat_monitorgamma_tv_range_max( "mat_monitorgamma_tv_range_max" );
ConVarRef mat_monitorgamma_tv_exp( "mat_monitorgamma_tv_exp" );
ConVarRef mat_monitorgamma_tv_enabled( "mat_monitorgamma_tv_enabled" );
SetHardwareGammaRamp( mat_monitorgamma.GetFloat(), mat_monitorgamma_tv_range_min.GetFloat(), mat_monitorgamma_tv_range_max.GetFloat(),
mat_monitorgamma_tv_exp.GetFloat(), mat_monitorgamma_tv_enabled.GetBool() );
}
#ifdef _X360
if ( mode != MATERIAL_NON_INTERACTIVE_MODE_NONE )
{
// HACK: VSync off (prevents us wasting time blocking on VSync due to our irregular present intervals)
Dx9Device()->SetRenderState( D3DRS_PRESENTINTERVAL, D3DPRESENT_INTERVAL_IMMEDIATE );
}
else
{
// HACK: VSync on if we want it.
Dx9Device()->SetRenderState( D3DRS_PRESENTINTERVAL, m_PresentParameters.PresentationInterval );
}
#elif defined (_PS3)
if ( mode != MATERIAL_NON_INTERACTIVE_MODE_NONE )
{
// HACK: VSync off (prevents us wasting time blocking on VSync due to our irregular present intervals)
g_ps3gcmGlobalState.SetFastFlip(1);
}
else
{
// HACK: VSync on if we want it.
g_ps3gcmGlobalState.SetFastFlip(0);
}
#endif
// Msg( "Time elapsed: %.3f Peak %.3f Ave %.5f Count %d Count Above %d\n", Plat_FloatTime() - m_NonInteractiveRefresh.m_flStartTime,
// m_NonInteractiveRefresh.m_flPeakDt, m_NonInteractiveRefresh.m_flTotalDt / m_NonInteractiveRefresh.m_nSamples, m_NonInteractiveRefresh.m_nSamples, m_NonInteractiveRefresh.m_nCountAbove66 );
m_NonInteractiveRefresh.m_flStartTime = m_NonInteractiveRefresh.m_flLastPresentTime =
m_NonInteractiveRefresh.m_flLastPacifierTime = Plat_FloatTime();
m_NonInteractiveRefresh.m_flPeakDt = 0.0f;
m_NonInteractiveRefresh.m_flTotalDt = 0.0f;
m_NonInteractiveRefresh.m_nSamples = 0;
m_NonInteractiveRefresh.m_nCountAbove66 = 0;
}
void CShaderDeviceDx8::UpdatePresentStats()
{
float t = Plat_FloatTime();
float flActualDt = t - m_NonInteractiveRefresh.m_flLastPresentTime;
if ( flActualDt > m_NonInteractiveRefresh.m_flPeakDt )
{
m_NonInteractiveRefresh.m_flPeakDt = flActualDt;
}
if ( flActualDt > 0.066 )
{
++m_NonInteractiveRefresh.m_nCountAbove66;
if ( mat_spew_long_frames.GetBool() )
{
Warning( "****LONG FRAME: %04d>66ms\n", ( int )( flActualDt * 1000 ) );
}
}
m_NonInteractiveRefresh.m_flTotalDt += flActualDt;
++m_NonInteractiveRefresh.m_nSamples;
t = Plat_FloatTime();
m_NonInteractiveRefresh.m_flLastPresentTime = t;
}
// at least on PS/3, framerate is capped at 30 fps (33ms) and trying to Present every
// 15 ms will cause a backlog of frames to render, which will effectively stall every Present after the first 2 for 33ms
#define LOADING_PRESENT_UPDATE_INTERVAL 0.05f
float g_flLastUpdateTime = 0.0f;
bool g_bInSwap = false;
#ifdef _PS3
struct Vector4
{
Vector4(){}
Vector4( float fx, float fy, float fz, float fw) { x=fx;y=fy;z=fz;w=fw; }
float x,y,z,w;
};
struct Matrix4x4
{
Vector4 r[4];
};
Matrix4x4 Matrix4x4OrthographicOffCenterLH( float ViewLeft, float ViewRight, float ViewBottom, float ViewTop, float NearZ, float FarZ )
{
Matrix4x4 M;
float ReciprocalWidth = 1.0f / (ViewRight - ViewLeft);
float ReciprocalHeight = 1.0f / (ViewTop - ViewBottom);
M.r[0] = Vector4(2 * ReciprocalWidth, 0.0f, 0.0f, 0.0f);
M.r[1] = Vector4(0.0f, -2 * ReciprocalHeight, 0.0f, 0.0f);
M.r[2] = Vector4(0.0f, 0.0f, 1.0f / (FarZ - NearZ), 0.0f);
M.r[3] = Vector4(-(ViewLeft + ViewRight) * ReciprocalWidth,
(ViewTop + ViewBottom) * ReciprocalHeight,
-M.r[2].z * NearZ,
1.0f);
return M;
}
#elif defined( _X360 )
#define Matrix4x4OrthographicOffCenterLH XMMatrixOrthographicOffCenterLH
#define Matrix4x4 XMMATRIX
#endif
#if ENABLE_MICRO_PROFILER
double g_time_PresentProfilerReset = 0;
CMicroProfiler g_mp_Present;
#endif
void CShaderDeviceDx8::OnDebugEvent( const char * pEvent )
{
#if ENABLE_MICRO_PROFILER
if( !IsCert() )
{
double timeNow = Plat_FloatTime(), timeDelta = timeNow - g_time_PresentProfilerReset;
double flSleepMilliseconds = g_mp_Present.GetTotalMilliseconds();
if( g_mp_Present.m_numCalls )
{
COM_TimestampedLog( "Present() Stats: %d flips / %.1f sec = ave %.1f fps. Sleep %.2f seconds = %.3fms/flip. %s\n", g_mp_Present.m_numCalls, timeDelta, timeDelta > 0.001 ? float( g_mp_Present.m_numCalls ) / timeDelta : 0.0f, flSleepMilliseconds * 1e-3f, g_mp_Present.m_numCalls ? flSleepMilliseconds / double( g_mp_Present.m_numCalls ) : 0.0f, pEvent );
}
else
{
COM_TimestampedLog( "Present() Stats: no flips / %.1f sec. %s\n", timeDelta, pEvent );
}
g_mp_Present.Reset();
g_time_PresentProfilerReset = timeNow;
}
#endif
}
void CShaderDeviceDx8::RefreshFrontBufferNonInteractive()
{
if ( !IsGameConsole() || !InNonInteractiveMode() )
return;
float flTimeBegin = Plat_FloatTime();
float dt = flTimeBegin - g_flLastUpdateTime;
#ifdef _PS3
// 7ltodo extern bool IsRsxReadyForNoninteractiveRefresh( );
// if( !IsRsxReadyForNoninteractiveRefresh( ) )
// {
// // why bother rendering anything if there are front buffers in the queue for flipping, or something was flipped 1 or less vblanks ago?
// // if we do bother to render in this case, we may enter a self-perpetuating bad state where we fill up the queue of front buffers to flip
// // and have to wait for up to 33 ms in every Present, effectively making this function stall for 33 ms for no good reason.
// return;
// }
#endif
if( dt < LOADING_PRESENT_UPDATE_INTERVAL || g_bInSwap || g_pMaterialSystem->IsInFrame() )
return;
g_bInSwap = true;
// Other code should not be talking to D3D at the same time as this
AUTO_LOCK_FM( m_nonInteractiveModeMutex );
#ifdef _GAMECONSOLE
g_pShaderAPI->OwnGPUResources( false );
IDirect3DBaseTexture *pTexture = g_pShaderAPI->GetD3DTexture( m_NonInteractiveRefresh.m_Info.m_hTempFullscreenTexture );
int w, h;
g_pShaderAPI->GetBackBufferDimensions( w, h );
Matrix4x4 matWVP = Matrix4x4OrthographicOffCenterLH( 0, (float)w, (float)h, 0, 0, 1 );
// Structure to hold vertex data.
struct TEXVERTEX
{
FLOAT Position[3];
FLOAT TexCoord[2];
};
TEXVERTEX Vertices[4];
float flPixelCenter = IsPS3() ? 0 : 0.5f;
bool bInStartupMode = ( m_NonInteractiveRefresh.m_Mode == MATERIAL_NON_INTERACTIVE_MODE_STARTUP );
#if defined( CSTRIKE15 )
if ( bInStartupMode )
{
// Render the initial vtf loading screen to match how we render our Scaleform backgrounds,
// so the transition between loading and Scaleform is seamless:
// HACK: These are the dimensions of the src background vtf
const float th = 1024.f;
const float tw = 1024.f;
// VTFs are forced to be square, even if the source texture is non 1:1. Rescale the
// texture to assume its actually in 16:9, as it was authored
float convertTH = th * 720.0f / 1280.0f;
// Now, determine the scale between the texture and the viewport in height
float heightScale = (float)h / convertTH;
int scaledTH = (int)( heightScale * (float) convertTH );
int scaledTW = (int)( heightScale * (float) tw );
float bgTop = (h / 2) - (scaledTH / 2) - flPixelCenter;
float bgLeft = (w / 2) - (scaledTW / 2) - flPixelCenter;
float bgBottom = (h / 2) + (scaledTH / 2) - flPixelCenter;
float bgRight = (w / 2) + (scaledTW / 2) - flPixelCenter;
Vertices[0].Position[0] = bgLeft;
Vertices[0].Position[1] = bgTop;
Vertices[0].Position[2] = 0;
Vertices[0].TexCoord[0] = 0;
Vertices[0].TexCoord[1] = 0;
Vertices[1].Position[0] = bgRight;
Vertices[1].Position[1] = bgTop;
Vertices[1].Position[2] = 0;
Vertices[1].TexCoord[0] = 1;
Vertices[1].TexCoord[1] = 0;
Vertices[2].Position[0] = bgRight;
Vertices[2].Position[1] = bgBottom;
Vertices[2].Position[2] = 0;
Vertices[2].TexCoord[0] = 1;
Vertices[2].TexCoord[1] = 1;
Vertices[3].Position[0] = bgLeft;
Vertices[3].Position[1] = bgBottom;
Vertices[3].Position[2] = 0;
Vertices[3].TexCoord[0] = 0;
Vertices[3].TexCoord[1] = 1;
}
else
#endif // !CSTRIKE15
{
Vertices[0].Position[0] = -flPixelCenter;
Vertices[0].Position[1] = -flPixelCenter;
Vertices[0].Position[2] = 0;
Vertices[0].TexCoord[0] = 0;
Vertices[0].TexCoord[1] = 0;
Vertices[1].Position[0] = w - flPixelCenter;
Vertices[1].Position[1] = -flPixelCenter;
Vertices[1].Position[2] = 0;
Vertices[1].TexCoord[0] = 1;
Vertices[1].TexCoord[1] = 0;
Vertices[2].Position[0] = w - flPixelCenter;
Vertices[2].Position[1] = h - flPixelCenter;
Vertices[2].Position[2] = 0;
Vertices[2].TexCoord[0] = 1;
Vertices[2].TexCoord[1] = 1;
Vertices[3].Position[0] = -flPixelCenter;
Vertices[3].Position[1] = h - flPixelCenter;
Vertices[3].Position[2] = 0;
Vertices[3].TexCoord[0] = 0;
Vertices[3].TexCoord[1] = 1;
}
D3DVIEWPORT9 viewport;
viewport.X = viewport.Y = 0;
viewport.Width = w; viewport.Height = h;
viewport.MinZ = ReverseDepthOnX360() ? 1.0f : 0.0f;
viewport.MaxZ = 1.0f - viewport.MinZ;
float flDepth = (ShaderUtil()->GetConfig().bReverseDepth ^ ReverseDepthOnX360()) ? 0.0f : 1.0f;
#ifdef _PS3
Dx9Device()->AntiAliasingHint( AA_HINT_MENU );
#endif
Dx9Device()->Clear( 0, NULL, D3DCLEAR_ZBUFFER | D3DCLEAR_STENCIL | D3DCLEAR_TARGET0, 0, flDepth, 0L );
Dx9Device()->SetViewport( &viewport );
Dx9Device()->SetTexture( 0, pTexture );
Dx9Device()->SetVertexShader( m_NonInteractiveRefresh.m_pVertexShader );
Dx9Device()->SetPixelShader( bInStartupMode ? m_NonInteractiveRefresh.m_pPixelShaderStartup : m_NonInteractiveRefresh.m_pPixelShader );
Dx9Device()->SetVertexShaderConstantF( 0, (FLOAT*)&matWVP, 4 );
Dx9Device()->SetVertexDeclaration( m_NonInteractiveRefresh.m_pVertexDecl );
Dx9Device()->SetSamplerState( 0, D3DSAMP_ADDRESSU, D3DTADDRESS_CLAMP );
Dx9Device()->SetSamplerState( 0, D3DSAMP_ADDRESSV, D3DTADDRESS_CLAMP );
Dx9Device()->SetSamplerState( 0, D3DSAMP_MINFILTER, D3DTEXF_LINEAR );
Dx9Device()->SetSamplerState( 0, D3DSAMP_MAGFILTER, D3DTEXF_LINEAR );
Dx9Device()->SetRenderState( D3DRS_ZENABLE, FALSE );
Dx9Device()->DrawPrimitiveUP( D3DPT_QUADLIST, 1, Vertices, sizeof( TEXVERTEX ) );
if ( bInStartupMode && m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedW && m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedH )
{
float flXPos = m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedX;
float flYPos = m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedY;
float flWidth = m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedW;
float flHeight = m_NonInteractiveRefresh.m_Info.m_flLogoNormalizedH;
int x = w * flXPos;
int y = h * flYPos;
int logoW = w * flWidth;
int logoH = h * flHeight;
Vertices[0].Position[0] = x - flPixelCenter;
Vertices[0].Position[1] = y - flPixelCenter;
Vertices[1].Position[0] = x + logoW - flPixelCenter;
Vertices[1].Position[1] = y - flPixelCenter;
Vertices[2].Position[0] = x + logoW - flPixelCenter;
Vertices[2].Position[1] = y + logoH - flPixelCenter;
Vertices[3].Position[0] = x - flPixelCenter;
Vertices[3].Position[1] = y + logoH - flPixelCenter;
pTexture = g_pShaderAPI->GetD3DTexture( m_NonInteractiveRefresh.m_Info.m_hLogoTexture );
Dx9Device()->SetRenderState( D3DRS_ALPHABLENDENABLE, 1 );
Dx9Device()->SetRenderState( D3DRS_SRCBLEND, D3DBLEND_SRCALPHA );
Dx9Device()->SetRenderState( D3DRS_DESTBLEND, D3DBLEND_INVSRCALPHA );
Dx9Device()->SetTexture( 0, pTexture );
Dx9Device()->SetPixelShader( m_NonInteractiveRefresh.m_pPixelShaderStartupPass2 );
//Dx9Device()->SetVertexShaderConstantF( 0, (FLOAT*)&matWVP, 4 );
Dx9Device()->DrawPrimitiveUP( D3DPT_QUADLIST, 1, Vertices, sizeof( TEXVERTEX ) );
}
if ( bInStartupMode && ( m_NonInteractiveRefresh.m_Info.m_nPacifierCount > 0 ) )
{
float flXPos = m_NonInteractiveRefresh.m_Info.m_flNormalizedX;
float flYPos = m_NonInteractiveRefresh.m_Info.m_flNormalizedY;
float flHeight = m_NonInteractiveRefresh.m_Info.m_flNormalizedSize;
int nSize = h * flHeight;
int x = w * flXPos - nSize * 0.5f;
int y = h * flYPos - nSize * 0.5f;
Vertices[0].Position[0] = x - flPixelCenter;
Vertices[0].Position[1] = y - flPixelCenter;
Vertices[1].Position[0] = x + nSize - flPixelCenter;
Vertices[1].Position[1] = y - flPixelCenter;
Vertices[2].Position[0] = x + nSize - flPixelCenter;
Vertices[2].Position[1] = y + nSize - flPixelCenter;
Vertices[3].Position[0] = x - flPixelCenter;
Vertices[3].Position[1] = y + nSize - flPixelCenter;
float flDt = flTimeBegin - m_NonInteractiveRefresh.m_flLastPacifierTime;
// Even if we are drawing faster than 10 hertz (goal is 60 for this path), only animate the spinner at 10 hertz.
if ( flDt > 0.10f )
{
if ( ++m_NonInteractiveRefresh.m_nPacifierFrame >= m_NonInteractiveRefresh.m_Info.m_nPacifierCount )
{
m_NonInteractiveRefresh.m_nPacifierFrame = 0;
}
m_NonInteractiveRefresh.m_flLastPacifierTime = flTimeBegin;
}
pTexture = g_pShaderAPI->GetD3DTexture( m_NonInteractiveRefresh.m_Info.m_pPacifierTextures[ m_NonInteractiveRefresh.m_nPacifierFrame ] );
Dx9Device()->SetRenderState( D3DRS_ALPHABLENDENABLE, 1 );
Dx9Device()->SetRenderState( D3DRS_SRCBLEND, D3DBLEND_SRCALPHA );
Dx9Device()->SetRenderState( D3DRS_DESTBLEND, D3DBLEND_INVSRCALPHA );
Dx9Device()->SetTexture( 0, pTexture );
Dx9Device()->SetPixelShader( m_NonInteractiveRefresh.m_pPixelShaderStartupPass2 );
Dx9Device()->DrawPrimitiveUP( D3DPT_QUADLIST, 1, Vertices, sizeof( TEXVERTEX ) );
}
Dx9Device()->SetVertexShader( NULL );
Dx9Device()->SetPixelShader( NULL );
Dx9Device()->SetTexture( 0, NULL );
Dx9Device()->SetVertexDeclaration( NULL );
Dx9Device()->SetRenderState( D3DRS_ZENABLE, TRUE );
Dx9Device()->Present( 0, 0, 0, 0 );
g_pShaderAPI->QueueResetRenderState();
g_pShaderAPI->OwnGPUResources( true );
UpdatePresentStats();
#endif
g_bInSwap = false;
// NOTE: It is necessary to re-read time, since Refresh
// may block, and if it does, it'll force a refresh every allocation
// if we don't resample time after the block
g_flLastUpdateTime = Plat_FloatTime();
#if !defined( _CERT )
float flPresentCost = g_flLastUpdateTime - flTimeBegin;
if( flPresentCost > ( IsDebug() ? 1e-3f : 5e-3f ) )
{
COM_TimestampedLog( "RefreshFrontBufferNonInteractive %.3f ms", flPresentCost * 1000 );
}
#endif
if ( IsPS3() )
{
// We can't trust device state after a swap/present operation.
// Reset all render state after the underlying PS3 device wrapper has reset its own state.
g_pShaderAPI->ResetRenderState( 1 );
}
}
//-----------------------------------------------------------------------------
// Page flip
//-----------------------------------------------------------------------------
void CShaderDeviceDx8::Present()
{
LOCK_SHADERAPI();
// flush the dynamic buffer and execute the per-draw call queuene
g_pShaderAPI->OnPresent();
if ( !IsDeactivated() )
{
Dx9Device()->EndScene();
}
HRESULT hr = S_OK;
// if we're in queued mode, don't present if the device is already lost
bool bValidPresent = true;
bool bInMainThread = ThreadInMainThread();
if ( !bInMainThread )
{
// don't present if the device is in an invalid state and in queued mode
if ( m_DeviceState != DEVICE_STATE_OK )
{
bValidPresent = false;
}
// check for lost device early in threaded mode
CheckDeviceLost( m_bOtherAppInitializing );
if ( m_DeviceState != DEVICE_STATE_OK )
{
bValidPresent = false;
}
}
// Copy the back buffer into the non-interactive temp buffer
if ( m_NonInteractiveRefresh.m_Mode == MATERIAL_NON_INTERACTIVE_MODE_LEVEL_LOAD )
{
g_pShaderAPI->CopyRenderTargetToTextureEx( m_NonInteractiveRefresh.m_Info.m_hTempFullscreenTexture, 0, NULL, NULL );
}
// If we're not iconified, try to present (without this check, we can flicker when Alt-Tabbed away)
#ifdef _WIN32
if ( IsX360() || (IsIconic( ( HWND )m_hWnd ) == 0 && bValidPresent) )
#else
if ( IsX360() || (IsIconic( (VD3DHWND)m_hWnd ) == 0 && bValidPresent) )
#endif
{
if ( IsPC() && ( m_IsResizing || ( m_ViewHWnd != (VD3DHWND)m_hWnd ) ) )
{
RECT destRect;
#if !defined( DX_TO_GL_ABSTRACTION )
GetClientRect( ( HWND )m_ViewHWnd, &destRect );
#else
toglGetClientRect( (VD3DHWND)m_ViewHWnd, &destRect );
#endif
ShaderViewport_t viewport;
g_pShaderAPI->GetViewports( &viewport, 1 );
RECT srcRect;
srcRect.left = viewport.m_nTopLeftX;
srcRect.right = viewport.m_nTopLeftX + viewport.m_nWidth;
srcRect.top = viewport.m_nTopLeftY;
srcRect.bottom = viewport.m_nTopLeftY + viewport.m_nHeight;
MICRO_PROFILE( g_mp_Present );
hr = Dx9Device()->Present( &srcRect, &destRect, (VD3DHWND)m_ViewHWnd, 0 );
}
else
{
g_pShaderAPI->OwnGPUResources( false );
MICRO_PROFILE( g_mp_Present );
hr = Dx9Device()->Present( 0, 0, 0, 0 );
}
}
UpdatePresentStats();
if ( IsPlatformWindows() )
{
if ( hr == D3DERR_DRIVERINTERNALERROR )
{
/* Usually this bug means that the driver has run out of internal video
memory, due to leaking it slowly over several application restarts.
As of summer 2007, IE in particular seemed to leak a lot of driver
memory for every image context it created in the browser window. A
reboot clears out the leaked memory and will generally allow the game
to be run again; occasionally (but not frequently) it's necessary to
reduce video settings in the game as well to run. But, this is too
fine a distinction to explain in a dialog, so place the guilt on the
user and ask them to reduce video settings regardless.
*/
Error( "Internal driver error at Present.\n"
"You're likely out of OS Paged Pool Memory! For more info, see\n"
"http://support.steampowered.com\n" );
}
if ( hr == D3DERR_DEVICELOST )
{
MarkDeviceLost();
}
}
MeshMgr()->DiscardVertexBuffers();
if ( bInMainThread )
{
CheckDeviceLost( m_bOtherAppInitializing );
}
if ( IsX360() )
{
// according to docs - "Mandatory Reset of GPU Registers"
// 360 must force the cached state to be dirty after any present()
g_pShaderAPI->ResetRenderState( false );
}
#ifdef RECORD_KEYFRAMES
static int frame = 0;
++frame;
if (frame == KEYFRAME_INTERVAL)
{
RECORD_COMMAND( DX8_KEYFRAME, 0 );
g_pShaderAPI->ResetRenderState();
frame = 0;
}
#endif
g_pShaderAPI->AdvancePIXFrame();
if ( !IsDeactivated() )
{
#ifndef DX_TO_GL_ABSTRACTION
if ( ( ShaderUtil()->GetConfig().bMeasureFillRate || ShaderUtil()->GetConfig().bVisualizeFillRate ) )
{
g_pShaderAPI->ClearBuffers( true, true, true, -1, -1 );
}
#endif
Dx9Device()->BeginScene();
}
if ( IsPS3() )
{
// We can't trust device state after a swap/present operation.
// Reset all render state after the underlying PS3 device wrapper has reset its own state.
g_pShaderAPI->ResetRenderState( false );
}
}
// We need to scale our colors to the range [16, 235] to keep our colors within TV standards. Some colors might
// still be out of gamut if any of the R, G, or B channels are more than 191 units apart from each other in
// the 0-255 scale, but it looks like the 360 deals with this for us by lowering the bright saturated color components.
// NOTE: I'm leaving the max at 255 to retain whiter than whites. On most TV's, we seems a little dark in the bright colors
// compared to TV and movies when played in the same conditions. This keeps out brights on par with what customers are
// used to seeing.
// TV's generally have a 2.5 gamma, so we need to convert our 2.2 frame buffer into a 2.5 frame buffer for display on a TV
#if defined( CSTRIKE15 )
ConVar mat_monitorgamma_pwl2srgb( "mat_monitorgamma_pwl2srgb", "0" );
ConVar mat_monitorgamma_vganonpwlgamma( "mat_monitorgamma_vganonpwlgamma", "2.2" );
#else
ConVar mat_monitorgamma_pwl2srgb( "mat_monitorgamma_pwl2srgb", "1" );
ConVar mat_monitorgamma_vganonpwlgamma( "mat_monitorgamma_vganonpwlgamma", "2.11" );
#endif
ConVar mat_monitorgamma_force_480_full_tv_range( "mat_monitorgamma_force_480_full_tv_range", "1" );
void CShaderDeviceDx8::SetHardwareGammaRamp( float fGamma, float fGammaTVRangeMin, float fGammaTVRangeMax, float fGammaTVExponent, bool bTVEnabled )
{
DevMsg( 2, "SetHardwareGammaRamp( %f )\n", fGamma );
Assert( Dx9Device() );
if( !Dx9Device() )
return;
DevMsg( 2, "**** Gamma Ramp: fGamma: %f fGammaTVRangeMin: %f fGammaTVRangeMax: %f fGammaTVExponent: %f bTVEnabled: %u\n",
fGamma, fGammaTVRangeMin, fGammaTVRangeMax, fGammaTVExponent, bTVEnabled );
#ifdef _PS3
// input gamma driven by UI: 1.8 - 2.6
// On PS3 we assume that TV mode is defaulting UI 2.2 value to 2.2/2.5 HW value
float flHwGamma = 2.2f / 2.5f;
if ( fGamma < 2.2 )
{
// we remap the range [1.8-2.2] into [0.8-2.2/2.5]
flHwGamma = 0.8 + ( fGamma - 1.8 ) / ( 2.2 - 1.8 ) * ( 2.2/2.5 - 0.8 );
}
else
{
// we remap the range [2.2-2.6] into [2.2/2.5 - 1.2]
flHwGamma = 2.2/2.5 + ( fGamma - 2.2 ) / ( 2.6 - 2.2 ) * ( 1.2 - 2.2/2.5 );
}
// ps3 hardware gamma range allowed by specifications: 0.8 - 1.2
flHwGamma = clamp( flHwGamma, 0.8f, 1.2f );
cellVideoOutSetGamma( CELL_VIDEO_OUT_PRIMARY, flHwGamma );
#else
#ifdef PLATFORM_X360
// On X360, if we're in TV mode, and not high def and at 480P/I or less, then we disable our [16,235] (or equivalent) conversion because the X360's
// system software already applies this adjustment (as far as we can determine) in the "Standard" Black level mode in the X360 dashboard.
// See: System Settings->Console Settings->Display->Black Level
if ( ( bTVEnabled ) && ( mat_monitorgamma_force_480_full_tv_range.GetBool() ) )
{
XVIDEO_MODE xvideoMode;
XGetVideoMode( &xvideoMode );
if ( ( !xvideoMode.fIsHiDef ) && ( xvideoMode.dwDisplayHeight <= 480 ) )
{
fGammaTVRangeMin = 0;
fGammaTVRangeMax = 255;
//Warning( "CShaderDeviceDx8::SetHardwareGammaRamp: Forcing TV range min/max in 480I/P mode to [0,255]\n" );
}
}
#endif
D3DGAMMARAMP gammaRamp;
for ( int i = 0; i < 256; i++ )
{
float flInputValue = float( i ) / 255.0f;
// Since the 360's sRGB read/write is a piecewise linear approximation, we need to correct for the difference in gamma space here
// We're purposely want PWL adjustment *enabled* here, even though we're no longer using PWL adjusted textures. This adjusts for the distortion introduced
// into our overall signal transfer function at low linear light scales.
float flSrgbGammaValue;
if ( IsX360() && mat_monitorgamma_pwl2srgb.GetInt() )
{
// First undo the 360 broken sRGB curve by bringing the value back into linear space
float flLinearValue = X360GammaToLinear( flInputValue );
flLinearValue = clamp( flLinearValue, 0.0f, 1.0f );
// Now apply a true sRGB curve to mimic PC hardware
flSrgbGammaValue = SrgbLinearToGamma( flLinearValue ); // ( flLinearValue <= 0.0031308f ) ? ( flLinearValue * 12.92f ) : ( 1.055f * powf( flLinearValue, ( 1.0f / 2.4f ) ) ) - 0.055f;
flSrgbGammaValue = clamp( flSrgbGammaValue, 0.0f, 1.0f );
}
else
{
flSrgbGammaValue = flInputValue;
}
// Apply the user controlled exponent curve
float flCorrection = pow( flSrgbGammaValue, ( fGamma / 2.2f ) );
flCorrection = clamp( flCorrection, 0.0f, 1.0f );
// TV adjustment - Apply an exp and a scale and bias
if ( bTVEnabled )
{
// Adjust for TV gamma of 2.5 by applying an exponent of 2.2 / 2.5 = 0.88
flCorrection = pow( flCorrection, 2.2f / fGammaTVExponent );
flCorrection = clamp( flCorrection, 0.0f, 1.0f ) ;
// Scale and bias to fit into the 16-235 range for TV's
flCorrection = ( flCorrection * ( fGammaTVRangeMax - fGammaTVRangeMin ) / 255.0f ) + ( fGammaTVRangeMin / 255.0f );
flCorrection = clamp( flCorrection, 0.0f, 1.0f );
}
#if !defined( CSTRIKE15 )
else if ( IsX360() )
{
// Approximate compensation for not using PWL textures on 360 in "monitor" (VGA) mode. Without this the low-end of the ramp will appear too bright at high linear light scales.
float flVGANonPWLAdjustmentGamma = mat_monitorgamma_vganonpwlgamma.GetFloat();
flCorrection = pow( flCorrection, 2.2f / flVGANonPWLAdjustmentGamma );
flCorrection = clamp( flCorrection, 0.0f, 1.0f );
}
#endif
// Generate final int value
unsigned int val = ( int )( flCorrection * 65535.0f );
gammaRamp.red[i] = val;
gammaRamp.green[i] = val;
gammaRamp.blue[i] = val;
}
if ( !CommandLine()->FindParm( "-nogammaramp" ) )
{
Dx9Device()->SetGammaRamp( 0, D3DSGR_NO_CALIBRATION, &gammaRamp );
}
#endif
}
//-----------------------------------------------------------------------------
// Shader compilation
//-----------------------------------------------------------------------------
IShaderBuffer* CShaderDeviceDx8::CompileShader( const char *pProgram, size_t nBufLen, const char *pShaderVersion )
{
return ShaderManager()->CompileShader( pProgram, nBufLen, pShaderVersion );
}
VertexShaderHandle_t CShaderDeviceDx8::CreateVertexShader( IShaderBuffer *pBuffer )
{
return ShaderManager()->CreateVertexShader( pBuffer );
}
void CShaderDeviceDx8::DestroyVertexShader( VertexShaderHandle_t hShader )
{
ShaderManager()->DestroyVertexShader( hShader );
}
GeometryShaderHandle_t CShaderDeviceDx8::CreateGeometryShader( IShaderBuffer* pShaderBuffer )
{
Assert( 0 );
return GEOMETRY_SHADER_HANDLE_INVALID;
}
void CShaderDeviceDx8::DestroyGeometryShader( GeometryShaderHandle_t hShader )
{
Assert( hShader == GEOMETRY_SHADER_HANDLE_INVALID );
}
PixelShaderHandle_t CShaderDeviceDx8::CreatePixelShader( IShaderBuffer *pBuffer )
{
return ShaderManager()->CreatePixelShader( pBuffer );
}
void CShaderDeviceDx8::DestroyPixelShader( PixelShaderHandle_t hShader )
{
ShaderManager()->DestroyPixelShader( hShader );
}
#ifdef DX_TO_GL_ABSTRACTION
void CShaderDeviceDx8::DoStartupShaderPreloading( void )
{
ShaderManager()->DoStartupShaderPreloading();
}
#endif
//-----------------------------------------------------------------------------
// Creates/destroys Mesh
// NOTE: Will be deprecated soon!
//-----------------------------------------------------------------------------
IMesh* CShaderDeviceDx8::CreateStaticMesh( VertexFormat_t vertexFormat, const char *pTextureBudgetGroup, IMaterial * pMaterial, VertexStreamSpec_t *pStreamSpec )
{
LOCK_SHADERAPI();
return MeshMgr()->CreateStaticMesh( vertexFormat, pTextureBudgetGroup, pMaterial, pStreamSpec );
}
void CShaderDeviceDx8::DestroyStaticMesh( IMesh* pMesh )
{
LOCK_SHADERAPI();
MeshMgr()->DestroyStaticMesh( pMesh );
}
//-----------------------------------------------------------------------------
// Creates/destroys vertex buffers + index buffers
//-----------------------------------------------------------------------------
IVertexBuffer *CShaderDeviceDx8::CreateVertexBuffer( ShaderBufferType_t type, VertexFormat_t fmt, int nVertexCount, const char *pBudgetGroup )
{
LOCK_SHADERAPI();
return MeshMgr()->CreateVertexBuffer( type, fmt, nVertexCount, pBudgetGroup );
}
void CShaderDeviceDx8::DestroyVertexBuffer( IVertexBuffer *pVertexBuffer )
{
LOCK_SHADERAPI();
MeshMgr()->DestroyVertexBuffer( pVertexBuffer );
}
IIndexBuffer *CShaderDeviceDx8::CreateIndexBuffer( ShaderBufferType_t bufferType, MaterialIndexFormat_t fmt, int nIndexCount, const char *pBudgetGroup )
{
LOCK_SHADERAPI();
return MeshMgr()->CreateIndexBuffer( bufferType, fmt, nIndexCount, pBudgetGroup );
}
void CShaderDeviceDx8::DestroyIndexBuffer( IIndexBuffer *pIndexBuffer )
{
LOCK_SHADERAPI();
MeshMgr()->DestroyIndexBuffer( pIndexBuffer );
}
IVertexBuffer *CShaderDeviceDx8::GetDynamicVertexBuffer( int streamID, VertexFormat_t vertexFormat, bool bBuffered )
{
LOCK_SHADERAPI();
return MeshMgr()->GetDynamicVertexBuffer( streamID, vertexFormat, bBuffered );
}
IIndexBuffer *CShaderDeviceDx8::GetDynamicIndexBuffer( )
{
LOCK_SHADERAPI();
return MeshMgr()->GetDynamicIndexBuffer( );
}
#ifdef _X360
void CShaderDeviceDx8::SpewVideoInfo360( const CCommand &args )
{
XVIDEO_MODE videoMode;
XGetVideoMode( &videoMode );
Warning( "back buffer size: %dx%d\n", m_PresentParameters.BackBufferWidth, m_PresentParameters.BackBufferHeight );
Warning( "display resolution: %dx%d %s\n", videoMode.dwDisplayWidth, videoMode.dwDisplayHeight, videoMode.fIsInterlaced ? "interlaced" : "progressive" );
Warning( "refresh rate: %f\n", videoMode.RefreshRate );
Warning( "aspect: %s\n", videoMode.fIsWideScreen ? "16x9 (widescreen)" : "4x3 (normal)" );
Warning( "%s\n", videoMode.fIsHiDef ? "hidef" : "lodef" );
switch( videoMode.VideoStandard )
{
case XC_VIDEO_STANDARD_NTSC_M:
Warning( "video standard: NTSC_M\n" );
break;
case XC_VIDEO_STANDARD_NTSC_J:
Warning( "video standard: NTSC_J\n" );
break;
case XC_VIDEO_STANDARD_PAL_I:
Warning( "video standard: PAL_I\n" );
break;
default:
Warning( "error: UNKNOWN VIDEO STANDARD!\n" );
Assert( 0 );
break;
}
ConVarRef fps_max( "fps_max" );
Warning( "fps_max: %f\n", fps_max.GetFloat() );
switch( m_PresentParameters.MultiSampleType )
{
case D3DMULTISAMPLE_NONE:
Warning( "multisample type: D3DMULTISAMPLE_NONE\n" );
break;
case D3DMULTISAMPLE_2_SAMPLES:
Warning( "multisample type: D3DMULTISAMPLE_2_SAMPLES\n" );
break;
case D3DMULTISAMPLE_4_SAMPLES:
Warning( "multisample type: D3DMULTISAMPLE_4_SAMPLES\n" );
break;
}
}
#endif