//========= Copyright © 1996-2005, Valve Corporation, All rights reserved. ============// // // Purpose: // // $NoKeywords: $ //===========================================================================// #ifndef FASTTIMER_H #define FASTTIMER_H #ifdef _WIN32 #pragma once #endif #include #include "tier0/platform.h" PLATFORM_INTERFACE uint64 g_ClockSpeed; PLATFORM_INTERFACE unsigned long g_dwClockSpeed; PLATFORM_INTERFACE double g_ClockSpeedMicrosecondsMultiplier; PLATFORM_INTERFACE double g_ClockSpeedMillisecondsMultiplier; PLATFORM_INTERFACE double g_ClockSpeedSecondsMultiplier; #ifdef COMPILER_MSVC64 extern "C" { unsigned __int64 __rdtsc(); } #pragma intrinsic(__rdtsc) #endif class CCycleCount { friend class CFastTimer; public: CCycleCount(); CCycleCount( uint64 cycles ); void Sample(); // Sample the clock. This takes about 34 clocks to execute (or 26,000 calls per millisecond on a P900). void Init(); // Set to zero. void Init( float initTimeMsec ); void Init( double initTimeMsec ) { Init( (float)initTimeMsec ); } void Init( uint64 cycles ); bool IsLessThan( CCycleCount const &other ) const; // Compare two counts. // Convert to other time representations. These functions are slow, so it's preferable to call them // during display rather than inside a timing block. unsigned long GetCycles() const; uint64 GetLongCycles() const; unsigned long GetMicroseconds() const; uint64 GetUlMicroseconds() const; double GetMicrosecondsF() const; void SetMicroseconds( unsigned long nMicroseconds ); unsigned long GetMilliseconds() const; double GetMillisecondsF() const; double GetSeconds() const; CCycleCount& operator+=( CCycleCount const &other ); // dest = rSrc1 + rSrc2 static void Add( CCycleCount const &rSrc1, CCycleCount const &rSrc2, CCycleCount &dest ); // Add two samples together. // dest = rSrc1 - rSrc2 static void Sub( CCycleCount const &rSrc1, CCycleCount const &rSrc2, CCycleCount &dest ); // Add two samples together. static uint64 GetTimestamp(); uint64 m_Int64; }; class CClockSpeedInit { public: CClockSpeedInit() { Init(); } static void Init() { const CPUInformation& pi = GetCPUInformation(); if ( !IsX360() ) { g_ClockSpeed = pi.m_Speed; } else { // cycle counter runs as doc'd at 1/64 Xbox 3.2GHz clock speed, thus 50 Mhz g_ClockSpeed = pi.m_Speed / 64L; } g_dwClockSpeed = (unsigned long)g_ClockSpeed; g_ClockSpeedMicrosecondsMultiplier = 1000000.0 / (double)g_ClockSpeed; g_ClockSpeedMillisecondsMultiplier = 1000.0 / (double)g_ClockSpeed; g_ClockSpeedSecondsMultiplier = 1.0f / (double)g_ClockSpeed; } }; class CFastTimer { public: // These functions are fast to call and should be called from your sampling code. void Start(); void End(); const CCycleCount & GetDuration() const; // Get the elapsed time between Start and End calls. CCycleCount GetDurationInProgress() const; // Call without ending. Not that cheap. // Return number of cycles per second on this processor. static inline unsigned long GetClockSpeed(); private: CCycleCount m_Duration; #ifdef DEBUG_FASTTIMER bool m_bRunning; // Are we currently running? #endif }; // This is a helper class that times whatever block of code it's in class CTimeScope { public: CTimeScope( CFastTimer *pTimer ); ~CTimeScope(); private: CFastTimer *m_pTimer; }; inline CTimeScope::CTimeScope( CFastTimer *pTotal ) { m_pTimer = pTotal; m_pTimer->Start(); } inline CTimeScope::~CTimeScope() { m_pTimer->End(); } // This is a helper class that times whatever block of code it's in and // adds the total (int microseconds) to a global counter. class CTimeAdder { public: CTimeAdder( CCycleCount *pTotal ); ~CTimeAdder(); void End(); private: CCycleCount *m_pTotal; CFastTimer m_Timer; }; inline CTimeAdder::CTimeAdder( CCycleCount *pTotal ) { m_pTotal = pTotal; m_Timer.Start(); } inline CTimeAdder::~CTimeAdder() { End(); } inline void CTimeAdder::End() { if( m_pTotal ) { m_Timer.End(); *m_pTotal += m_Timer.GetDuration(); m_pTotal = 0; } } // -------------------------------------------------------------------------- // // Simple tool to support timing a block of code, and reporting the results on // program exit or at each iteration // // Macros used because dbg.h uses this header, thus Msg() is unavailable // -------------------------------------------------------------------------- // #define PROFILE_SCOPE(name) \ class C##name##ACC : public CAverageCycleCounter \ { \ public: \ ~C##name##ACC() \ { \ Msg("%-48s: %6.3f avg (%8.1f total, %7.3f peak, %5d iters)\n", \ #name, \ GetAverageMilliseconds(), \ GetTotalMilliseconds(), \ GetPeakMilliseconds(), \ GetIters() ); \ } \ }; \ static C##name##ACC name##_ACC; \ CAverageTimeMarker name##_ATM( &name##_ACC ) #define TIME_SCOPE(name) \ class CTimeScopeMsg_##name \ { \ public: \ CTimeScopeMsg_##name() { m_Timer.Start(); } \ ~CTimeScopeMsg_##name() \ { \ m_Timer.End(); \ Msg( #name "time: %.4fms\n", m_Timer.GetDuration().GetMillisecondsF() ); \ } \ private: \ CFastTimer m_Timer; \ } name##_TSM; // -------------------------------------------------------------------------- // class CAverageCycleCounter { public: CAverageCycleCounter(); void Init(); void MarkIter( const CCycleCount &duration ); unsigned GetIters() const; double GetAverageMilliseconds() const; double GetTotalMilliseconds() const; double GetPeakMilliseconds() const; private: unsigned m_nIters; CCycleCount m_Total; CCycleCount m_Peak; bool m_fReport; const tchar *m_pszName; }; // -------------------------------------------------------------------------- // class CAverageTimeMarker { public: CAverageTimeMarker( CAverageCycleCounter *pCounter ); ~CAverageTimeMarker(); private: CAverageCycleCounter *m_pCounter; CFastTimer m_Timer; }; // -------------------------------------------------------------------------- // // CCycleCount inlines. // -------------------------------------------------------------------------- // inline CCycleCount::CCycleCount() { Init( (uint64)0 ); } inline CCycleCount::CCycleCount( uint64 cycles ) { Init( cycles ); } inline void CCycleCount::Init() { Init( (uint64)0 ); } inline void CCycleCount::Init( float initTimeMsec ) { if ( g_ClockSpeedMillisecondsMultiplier > 0 ) Init( (uint64)(initTimeMsec / g_ClockSpeedMillisecondsMultiplier) ); else Init( (uint64)0 ); } inline void CCycleCount::Init( uint64 cycles ) { m_Int64 = cycles; } #ifdef COMPILER_MSVC #pragma warning(push) #pragma warning(disable : 4189) // warning C4189: local variable is initialized but not referenced #endif inline void CCycleCount::Sample() { #ifdef COMPILER_MSVC64 unsigned __int64* pSample = (unsigned __int64*)&m_Int64; *pSample = __rdtsc(); // Msg( "Sample = %I64x", pSample ); #elif defined( _X360 ) // only need lower 32 bits, avoids doc'd read bug and 32 bit rollover is in 85 seconds m_Int64 = (uint64)__mftb32(); // scale back up, needs to be viewed as 1 cycle/clock #elif defined( __GNUC__ ) unsigned long* pSample = (unsigned long *)&m_Int64; __asm__ __volatile__ ( "rdtsc\n\t" "movl %%eax, (%0)\n\t" "movl %%edx, 4(%0)\n\t" : /* no output regs */ : "D" (pSample) : "%eax", "%edx" ); #elif defined( _WIN32 ) unsigned long* pSample = (unsigned long *)&m_Int64; __asm { // force the cpu to synchronize the instruction queue // NJS: CPUID can really impact performance in tight loops. //cpuid //cpuid //cpuid mov ecx, pSample rdtsc mov [ecx], eax mov [ecx+4], edx } #elif defined( POSIX ) unsigned long* pSample = (unsigned long *)&m_Int64; __asm__ __volatile__ ( "rdtsc\n\t" "movl %%eax, (%0)\n\t" "movl %%edx, 4(%0)\n\t" : /* no output regs */ : "D" (pSample) : "%eax", "%edx" ); #endif } #ifdef COMPILER_MSVC #pragma warning(pop) #endif inline CCycleCount& CCycleCount::operator+=( CCycleCount const &other ) { m_Int64 += other.m_Int64; return *this; } inline void CCycleCount::Add( CCycleCount const &rSrc1, CCycleCount const &rSrc2, CCycleCount &dest ) { dest.m_Int64 = rSrc1.m_Int64 + rSrc2.m_Int64; } inline void CCycleCount::Sub( CCycleCount const &rSrc1, CCycleCount const &rSrc2, CCycleCount &dest ) { dest.m_Int64 = rSrc1.m_Int64 - rSrc2.m_Int64; } inline uint64 CCycleCount::GetTimestamp() { CCycleCount c; c.Sample(); return c.GetLongCycles(); } inline bool CCycleCount::IsLessThan(CCycleCount const &other) const { return m_Int64 < other.m_Int64; } inline unsigned long CCycleCount::GetCycles() const { return (unsigned long)m_Int64; } inline uint64 CCycleCount::GetLongCycles() const { return m_Int64; } inline unsigned long CCycleCount::GetMicroseconds() const { return (unsigned long)((m_Int64 * 1000000) / g_ClockSpeed); } inline uint64 CCycleCount::GetUlMicroseconds() const { return ((m_Int64 * 1000000) / g_ClockSpeed); } inline double CCycleCount::GetMicrosecondsF() const { return (double)( m_Int64 * g_ClockSpeedMicrosecondsMultiplier ); } inline void CCycleCount::SetMicroseconds( unsigned long nMicroseconds ) { m_Int64 = ((uint64)nMicroseconds * g_ClockSpeed) / 1000000; } inline unsigned long CCycleCount::GetMilliseconds() const { return (unsigned long)((m_Int64 * 1000) / g_ClockSpeed); } inline double CCycleCount::GetMillisecondsF() const { return (double)( m_Int64 * g_ClockSpeedMillisecondsMultiplier ); } inline double CCycleCount::GetSeconds() const { return (double)( m_Int64 * g_ClockSpeedSecondsMultiplier ); } // -------------------------------------------------------------------------- // // CFastTimer inlines. // -------------------------------------------------------------------------- // inline void CFastTimer::Start() { m_Duration.Sample(); #ifdef DEBUG_FASTTIMER m_bRunning = true; #endif } inline void CFastTimer::End() { CCycleCount cnt; cnt.Sample(); if ( IsX360() ) { // have to handle rollover, hires timer is only accurate to 32 bits // more than one overflow should not have occurred, otherwise caller should use a slower timer if ( (uint64)cnt.m_Int64 <= (uint64)m_Duration.m_Int64 ) { // rollover occurred cnt.m_Int64 += 0x100000000LL; } } m_Duration.m_Int64 = cnt.m_Int64 - m_Duration.m_Int64; #ifdef DEBUG_FASTTIMER m_bRunning = false; #endif } inline CCycleCount CFastTimer::GetDurationInProgress() const { CCycleCount cnt; cnt.Sample(); if ( IsX360() ) { // have to handle rollover, hires timer is only accurate to 32 bits // more than one overflow should not have occurred, otherwise caller should use a slower timer if ( (uint64)cnt.m_Int64 <= (uint64)m_Duration.m_Int64 ) { // rollover occurred cnt.m_Int64 += 0x100000000LL; } } CCycleCount result; result.m_Int64 = cnt.m_Int64 - m_Duration.m_Int64; return result; } inline unsigned long CFastTimer::GetClockSpeed() { return g_dwClockSpeed; } inline CCycleCount const& CFastTimer::GetDuration() const { #ifdef DEBUG_FASTTIMER assert( !m_bRunning ); #endif return m_Duration; } // -------------------------------------------------------------------------- // // CAverageCycleCounter inlines inline CAverageCycleCounter::CAverageCycleCounter() : m_nIters( 0 ) { } inline void CAverageCycleCounter::Init() { m_Total.Init(); m_Peak.Init(); m_nIters = 0; } inline void CAverageCycleCounter::MarkIter( const CCycleCount &duration ) { ++m_nIters; m_Total += duration; if ( m_Peak.IsLessThan( duration ) ) m_Peak = duration; } inline unsigned CAverageCycleCounter::GetIters() const { return m_nIters; } inline double CAverageCycleCounter::GetAverageMilliseconds() const { if ( m_nIters ) return (m_Total.GetMillisecondsF() / (double)m_nIters); else return 0; } inline double CAverageCycleCounter::GetTotalMilliseconds() const { return m_Total.GetMillisecondsF(); } inline double CAverageCycleCounter::GetPeakMilliseconds() const { return m_Peak.GetMillisecondsF(); } // -------------------------------------------------------------------------- // inline CAverageTimeMarker::CAverageTimeMarker( CAverageCycleCounter *pCounter ) { m_pCounter = pCounter; m_Timer.Start(); } inline CAverageTimeMarker::~CAverageTimeMarker() { m_Timer.End(); m_pCounter->MarkIter( m_Timer.GetDuration() ); } // CLimitTimer // Use this to time whether a desired interval of time has passed. It's extremely fast // to check while running. class CLimitTimer { public: void SetLimit( uint64 m_cMicroSecDuration ); bool BLimitReached( void ); private: uint64 m_lCycleLimit; }; //----------------------------------------------------------------------------- // Purpose: Initializes the limit timer with a period of time to measure. // Input : cMicroSecDuration - How long a time period to measure //----------------------------------------------------------------------------- inline void CLimitTimer::SetLimit( uint64 m_cMicroSecDuration ) { uint64 dlCycles = ( ( uint64 ) m_cMicroSecDuration * ( uint64 ) g_dwClockSpeed ) / ( uint64 ) 1000000L; CCycleCount cycleCount; cycleCount.Sample( ); m_lCycleLimit = cycleCount.GetLongCycles( ) + dlCycles; } //----------------------------------------------------------------------------- // Purpose: Determines whether our specified time period has passed // Output: true if at least the specified time period has passed //----------------------------------------------------------------------------- inline bool CLimitTimer::BLimitReached( ) { CCycleCount cycleCount; cycleCount.Sample( ); return ( cycleCount.GetLongCycles( ) >= m_lCycleLimit ); } #endif // FASTTIMER_H