0ad/source/lib/sysdep/os/win/whrt/tsc.cpp
elexis 43137fef3f Make all Wildfire Games copyright headers consistent by always ending with a period and using (C) instead of (c).
Differential Revision: https://code.wildfiregames.com/D716
Refs 09e974e1cb
Reviewed By: bb
Change in agreement with leper.

This was SVN commit r19899.
2017-07-10 14:26:24 +00:00

259 lines
6.8 KiB
C++

/* Copyright (C) 2010 Wildfire Games.
*
* Permission is hereby granted, free of charge, to any person obtaining
* a copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sublicense, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice shall be included
* in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
/*
* Timer implementation using RDTSC
*/
#include "precompiled.h"
#include "lib/sysdep/os/win/whrt/tsc.h"
#include "lib/sysdep/os/win/whrt/counter.h"
#include "lib/bits.h"
#include "lib/sysdep/acpi.h"
#include "lib/sysdep/os_cpu.h"
#include "lib/sysdep/os/win/win.h"
#include "lib/sysdep/os/win/wutil.h"
#if ARCH_X86_X64
# include "lib/sysdep/arch/x86_x64/x86_x64.h" // x86_x64::rdtsc
# include "lib/sysdep/arch/x86_x64/topology.h"
# include "lib/sysdep/arch/x86_x64/msr.h"
#endif
//-----------------------------------------------------------------------------
static bool IsUniprocessor()
{
if(topology::NumPackages() != 1)
return false;
if(topology::CoresPerPackage() != 1)
return false;
return true;
}
static bool IsInvariantTSC()
{
#if ARCH_X86_X64
// (we no longer need to check x86_x64::Vendor - Intel and AMD
// agreed on the definition of this feature check)
x86_x64::CpuidRegs regs = { 0 };
regs.eax = 0x80000007;
if(x86_x64::cpuid(&regs))
{
// TSC is invariant across P-state, C-state, turbo, and
// stop grant transitions (e.g. STPCLK)
if(regs.edx & BIT(8))
return true;
}
#endif
return false;
}
static bool IsThrottlingPossible()
{
#if ARCH_X86_X64
x86_x64::CpuidRegs regs = { 0 };
switch(x86_x64::Vendor())
{
case x86_x64::VENDOR_INTEL:
if(x86_x64::Cap(x86_x64::CAP_TM_SCC) || x86_x64::Cap(x86_x64::CAP_EST))
return true;
break;
case x86_x64::VENDOR_AMD:
regs.eax = 0x80000007;
if(x86_x64::cpuid(&regs))
{
enum AmdPowerNowFlags
{
PN_FREQ_ID_CTRL = BIT(1),
PN_HW_THERMAL_CTRL = BIT(4),
PN_SW_THERMAL_CTRL = BIT(5)
};
if(regs.edx & (PN_FREQ_ID_CTRL|PN_HW_THERMAL_CTRL|PN_SW_THERMAL_CTRL))
return true;
}
break;
default:
break;
}
#endif
return false;
}
static bool IsSandyBridge()
{
if(x86_x64::Vendor() != x86_x64::VENDOR_INTEL)
return false;
if(x86_x64::Model() == x86_x64::MODEL_SANDY_BRIDGE)
return true;
if(x86_x64::Model() == x86_x64::MODEL_SANDY_BRIDGE_2)
return true;
return false;
}
//-----------------------------------------------------------------------------
class CounterTSC : public ICounter
{
public:
virtual const char* Name() const
{
return "TSC";
}
Status Activate()
{
#if ARCH_X86_X64
if(!x86_x64::Cap(x86_x64::CAP_TSC))
return ERR::NOT_SUPPORTED; // NOWARN (CPU doesn't support RDTSC)
#endif
return INFO::OK;
}
void Shutdown()
{
}
bool IsSafe() const
{
// using the TSC for timing is subject to a litany of
// potential problems, discussed below:
if(IsInvariantTSC())
return true;
// SMP or multi-core => counters are unsynchronized. both offset and
// drift could be solved by maintaining separate per-core
// counter states, but that requires atomic reads of the TSC and
// the current processor number.
//
// (otherwise, we have a subtle race condition: if preempted while
// reading the time and rescheduled on a different core, incorrect
// results may be returned, which would be unacceptable.)
//
// unfortunately this isn't possible without OS support or the
// as yet unavailable RDTSCP instruction => unsafe.
//
// (note: if the TSC is invariant, drift is no longer a concern.
// we could synchronize the TSC MSRs during initialization and avoid
// per-core counter state and the race condition mentioned above.
// however, we won't bother, since such platforms aren't yet widespread
// and would surely support the nice and safe HPET, anyway)
if(!IsUniprocessor())
return false;
const FADT* fadt = (const FADT*)acpi_GetTable("FACP");
if(fadt)
{
ENSURE(fadt->header.size >= sizeof(FADT));
// TSC isn't incremented in deep-sleep states => unsafe.
if(fadt->IsC3Supported())
return false;
// frequency throttling possible => unsafe.
if(fadt->IsDutyCycleSupported())
return false;
}
#if ARCH_X86_X64
// recent CPU:
//if(x86_x64::Generation() >= 7)
{
// note: 8th generation CPUs support C1-clock ramping, which causes
// drift on multi-core systems, but those were excluded above.
// in addition to frequency changes due to P-state transitions,
// we're also subject to STPCLK throttling. this happens when
// the chipset thinks the system is dangerously overheated; the
// OS isn't even notified. this may be rare, but could cause
// incorrect results => unsafe.
//return false;
}
#endif
// we're dealing with a single older CPU; the only problem there is
// throttling, i.e. changes to the TSC frequency. we don't want to
// disable this because it may be important for cooling. the OS
// initiates changes but doesn't notify us; jumps are too frequent
// and drastic to detect and account for => unsafe.
if(IsThrottlingPossible())
return false;
return true;
}
u64 Counter() const
{
return x86_x64::rdtsc();
}
size_t CounterBits() const
{
return 64;
}
double NominalFrequency() const
{
// WARNING: do not call x86_x64::ClockFrequency because it uses the
// HRT, which we're currently in the process of initializing.
// instead query CPU clock frequency via OS.
//
// note: even here, initial accuracy isn't critical because the
// clock is subject to thermal drift and would require continual
// recalibration anyway.
#if ARCH_X86_X64
if(MSR::IsAccessible() && MSR::HasPlatformInfo())
{
const i64 busFrequency = IsSandyBridge()? 100000000 : 133333333;
const u64 platformInfo = MSR::Read(MSR::PLATFORM_INFO);
const u8 maxNonTurboRatio = bits(platformInfo, 8, 15);
return double(maxNonTurboRatio) * busFrequency;
}
else
#endif
return os_cpu_ClockFrequency();
}
double Resolution() const
{
return 1.0 / NominalFrequency();
}
};
ICounter* CreateCounterTSC(void* address, size_t size)
{
ENSURE(sizeof(CounterTSC) <= size);
return new(address) CounterTSC();
}