mirror of
https://gitea.wildfiregames.com/0ad/0ad
synced 2026-06-18 14:23:56 -07:00
also rename wchar -> utf8 to avoid conflict with <wchar.h> (requires rebuild of workspace) (unfortunately copying history fails to "502 bad gateway"; had to delete old + add new independently) This was SVN commit r7340.
204 lines
5.9 KiB
C++
204 lines
5.9 KiB
C++
/* Copyright (c) 2010 Wildfire Games
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining
|
|
* a copy of this software and associated documentation files (the
|
|
* "Software"), to deal in the Software without restriction, including
|
|
* without limitation the rights to use, copy, modify, merge, publish,
|
|
* distribute, sublicense, and/or sell copies of the Software, and to
|
|
* permit persons to whom the Software is furnished to do so, subject to
|
|
* the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included
|
|
* in all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
/*
|
|
* Timer implementation using RDTSC
|
|
*/
|
|
|
|
#include "precompiled.h"
|
|
#include "lib/sysdep/os/win/whrt/tsc.h"
|
|
|
|
#include "lib/sysdep/os/win/whrt/counter.h"
|
|
|
|
#include "lib/bits.h"
|
|
#include "lib/sysdep/os_cpu.h"
|
|
#include "lib/sysdep/os/win/win.h"
|
|
#include "lib/sysdep/os/win/wutil.h"
|
|
|
|
#if ARCH_X86_X64
|
|
# include "lib/sysdep/arch/x86_x64/x86_x64.h" // x86_x64_rdtsc
|
|
# include "lib/sysdep/arch/x86_x64/topology.h"
|
|
#endif
|
|
|
|
|
|
//-----------------------------------------------------------------------------
|
|
// detect throttling
|
|
|
|
enum AmdPowerNowFlags
|
|
{
|
|
PN_FREQ_ID_CTRL = BIT(1),
|
|
PN_SW_THERMAL_CTRL = BIT(5),
|
|
PN_INVARIANT_TSC = BIT(8)
|
|
};
|
|
|
|
static bool IsThrottlingPossible()
|
|
{
|
|
#if ARCH_X86_X64
|
|
x86_x64_CpuidRegs regs;
|
|
switch(x86_x64_Vendor())
|
|
{
|
|
case X86_X64_VENDOR_INTEL:
|
|
if(x86_x64_cap(X86_X64_CAP_TM_SCC) || x86_x64_cap(X86_X64_CAP_EST))
|
|
return true;
|
|
break;
|
|
|
|
case X86_X64_VENDOR_AMD:
|
|
regs.eax = 0x80000007;
|
|
if(x86_x64_cpuid(®s))
|
|
{
|
|
if(regs.edx & (PN_FREQ_ID_CTRL|PN_SW_THERMAL_CTRL))
|
|
return true;
|
|
}
|
|
break;
|
|
}
|
|
return false;
|
|
#endif
|
|
}
|
|
|
|
|
|
//-----------------------------------------------------------------------------
|
|
|
|
class CounterTSC : public ICounter
|
|
{
|
|
public:
|
|
virtual const wchar_t* Name() const
|
|
{
|
|
return L"TSC";
|
|
}
|
|
|
|
LibError Activate()
|
|
{
|
|
#if ARCH_X86_X64
|
|
if(!x86_x64_cap(X86_X64_CAP_TSC))
|
|
return ERR::NO_SYS; // NOWARN (CPU doesn't support RDTSC)
|
|
#endif
|
|
|
|
return INFO::OK;
|
|
}
|
|
|
|
void Shutdown()
|
|
{
|
|
}
|
|
|
|
bool IsSafe() const
|
|
{
|
|
// use of the TSC for timing is subject to a litany of potential problems:
|
|
// - separate, unsynchronized counters with offset and drift;
|
|
// - frequency changes (P-state transitions and STPCLK throttling);
|
|
// - failure to increment in C3 and C4 deep-sleep states.
|
|
// we will discuss the specifics below.
|
|
|
|
// SMP or multi-core => counters are unsynchronized. this could be
|
|
// solved by maintaining separate per-core counter states, but that
|
|
// requires atomic reads of the TSC and the current processor number.
|
|
//
|
|
// (otherwise, we have a subtle race condition: if preempted while
|
|
// reading the time and rescheduled on a different core, incorrect
|
|
// results may be returned, which would be unacceptable.)
|
|
//
|
|
// unfortunately this isn't possible without OS support or the
|
|
// as yet unavailable RDTSCP instruction => unsafe.
|
|
//
|
|
// (note: if the TSC is invariant, drift is no longer a concern.
|
|
// we could synchronize the TSC MSRs during initialization and avoid
|
|
// per-core counter state and the abovementioned race condition.
|
|
// however, we won't bother, since such platforms aren't yet widespread
|
|
// and would surely support the nice and safe HPET, anyway)
|
|
{
|
|
WinScopedLock lock(WHRT_CS);
|
|
const CpuTopology* topology = cpu_topology_Detect();
|
|
if(cpu_topology_NumPackages(topology) != 1 || cpu_topology_CoresPerPackage(topology) != 1)
|
|
return false;
|
|
}
|
|
|
|
#if ARCH_X86_X64
|
|
// recent CPU:
|
|
if(x86_x64_Generation() >= 7)
|
|
{
|
|
// note: 8th generation CPUs support C1-clock ramping, which causes
|
|
// drift on multi-core systems, but those were excluded above.
|
|
|
|
x86_x64_CpuidRegs regs;
|
|
regs.eax = 0x80000007;
|
|
if(x86_x64_cpuid(®s))
|
|
{
|
|
// TSC is invariant WRT P-state, C-state and STPCLK => safe.
|
|
if(regs.edx & PN_INVARIANT_TSC)
|
|
return true;
|
|
}
|
|
|
|
// in addition to P-state transitions, we're also subject to
|
|
// STPCLK throttling. this happens when the chipset thinks the
|
|
// system is dangerously overheated; the OS isn't even notified.
|
|
// it may be rare, but could cause incorrect results => unsafe.
|
|
return false;
|
|
|
|
// newer systems also support the C3 Deep Sleep state, in which
|
|
// the TSC isn't incremented. that's not nice, but irrelevant
|
|
// since STPCLK dooms the TSC on those systems anyway.
|
|
}
|
|
#endif
|
|
|
|
// we're dealing with a single older CPU; the only problem there is
|
|
// throttling, i.e. changes to the TSC frequency. we don't want to
|
|
// disable this because it may be important for cooling. the OS
|
|
// initiates changes but doesn't notify us; jumps are too frequent
|
|
// and drastic to detect and account for => unsafe.
|
|
if(IsThrottlingPossible())
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
u64 Counter() const
|
|
{
|
|
return x86_x64_rdtsc();
|
|
}
|
|
|
|
size_t CounterBits() const
|
|
{
|
|
return 64;
|
|
}
|
|
|
|
double NominalFrequency() const
|
|
{
|
|
// WARNING: do not call x86_x64_ClockFrequency because it uses the
|
|
// HRT, which we're currently in the process of initializing.
|
|
// instead query CPU clock frequency via OS.
|
|
//
|
|
// note: even here, initial accuracy isn't critical because the
|
|
// clock is subject to thermal drift and would require continual
|
|
// recalibration anyway.
|
|
return os_cpu_ClockFrequency();
|
|
}
|
|
|
|
double Resolution() const
|
|
{
|
|
return 1.0 / NominalFrequency();
|
|
}
|
|
};
|
|
|
|
ICounter* CreateCounterTSC(void* address, size_t size)
|
|
{
|
|
debug_assert(sizeof(CounterTSC) <= size);
|
|
return new(address) CounterTSC();
|
|
}
|