536 lines
12 KiB
536 lines
12 KiB
4 years ago
|
/*==LICENSE==*

CyanWorlds.com Engine - MMOG client, server and tools
Copyright (C) 2011 Cyan Worlds, Inc.

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.

Additional permissions under GNU GPL version 3 section 7

If you modify this Program, or any covered work, by linking or
combining it with any of RAD Game Tools Bink SDK, Autodesk 3ds Max SDK,
NVIDIA PhysX SDK, Microsoft DirectX SDK, OpenSSL library, Independent
JPEG Group JPEG library, Microsoft Windows Media SDK, or Apple QuickTime SDK
(or a modified version of those libraries),
containing parts covered by the terms of the Bink SDK EULA, 3ds Max EULA,
PhysX SDK EULA, DirectX SDK EULA, OpenSSL and SSLeay licenses, IJG
JPEG Library README, Windows Media SDK EULA, or QuickTime SDK EULA, the
licensors of this Program grant you additional
permission to convey the resulting work. Corresponding Source for a
non-source form of such a combination shall include the source code for
the parts of OpenSSL and IJG JPEG Library used as well as that of the covered
work.

You can contact Cyan Worlds, Inc. by email legal@cyan.com
or by snail mail at:
Cyan Worlds, Inc.
14617 N Newport Hwy
Mead, WA 99021

*==LICENSE==*/
|
||
|
#include "plProfileManager.h"
|
||
|
#include "plProfile.h"
|
||
|
#include "hsTimer.h"
|
||
|
|
||
|
#include "hsUtils.h"
|
||
|
|
||
|
// Number of profile ticks per millisecond. Assigned in the plProfileManager
// constructor and read by the TicksToMSec / MSecToTicks macros.
static UInt32 gCyclesPerMS(0);
|
||
|
|
||
|
// The cycle-counter based timer is only selected for Win32 builds.
#if defined(HS_BUILD_FOR_WIN32)
#   define USE_FAST_TIMER
#endif
|
||
|
|
||
|
#ifdef USE_FAST_TIMER
|
||
|
|
||
|
#pragma warning (push)
|
||
|
#pragma warning (disable : 4035) // disable no return value warning
|
||
|
|
||
|
__forceinline UInt32 GetPentiumCounter()
|
||
|
{
|
||
|
__asm
|
||
|
{
|
||
|
xor eax,eax // VC won't realize that eax is modified w/out this
|
||
|
// instruction to modify the val.
|
||
|
// Problem shows up in release mode builds
|
||
|
_emit 0x0F // Pentium high-freq counter to edx;eax
|
||
|
_emit 0x31 // only care about low 32 bits in eax
|
||
|
|
||
|
xor edx,edx // so VC gets that edx is modified
|
||
|
}
|
||
|
}
|
||
|
|
||
|
#pragma warning (pop)
|
||
|
|
||
|
#include "hsWindows.h"
|
||
|
|
||
|
// Reads the nominal speed of processor 0 from the registry value
//   HKEY_LOCAL_MACHINE\HARDWARE\DESCRIPTION\System\CentralProcessor\0\~MHz
// and returns it in Hz.
//
// Returns 0 when the key or the value cannot be read, so the caller can fall
// back to measuring the speed. Speeds that do not fit in a UInt32 once
// converted to Hz (more than 4294 MHz) are clamped to 0xFFFFFFFF rather than
// being allowed to wrap around to a much smaller number.
static UInt32 GetProcSpeed()
{
    // The full sub-key path is opened in a single call. The predefined
    // HKEY_LOCAL_MACHINE handle is never passed to RegCloseKey.
    HKEY cpuKey = NULL;
    if (RegOpenKeyEx(HKEY_LOCAL_MACHINE,
                     "HARDWARE\\DESCRIPTION\\System\\CentralProcessor\\0",
                     0, KEY_READ, &cpuKey) != ERROR_SUCCESS)
    {
        return 0;
    }

    DWORD mhz = 0;
    DWORD size = sizeof(mhz);
    const LONG status = RegQueryValueEx(cpuKey, "~MHz", 0, NULL, (BYTE*)&mhz, &size);
    RegCloseKey(cpuKey);

    if (status != ERROR_SUCCESS)
        return 0;

    const UInt32 kHzPerMHz = 1000000;
    const UInt32 kMaxMHz = 0xFFFFFFFF / kHzPerMHz;
    if (mhz > kMaxMHz)
        return 0xFFFFFFFF;      // saturate instead of overflowing

    return mhz * kHzPerMHz;
}
|
||
|
|
||
|
// Estimates the processor speed in Hz by counting profile ticks
// (plProfileManager::GetTime) across a 250 ms Sleep and scaling them by the
// performance-counter frequency.
//
// Returns 0 when the performance counter yields no usable interval or
// frequency. Results that do not fit in a UInt32 are clamped to 0xFFFFFFFF
// instead of being truncated.
UInt32 GetProcSpeedAlt()
{
    const UInt32 kSamplePeriodMS = 250;

    // Raise priority to avoid interference from other threads.
    const HANDLE thread = GetCurrentThread();
    const int priority = GetThreadPriority(thread);
    SetThreadPriority(thread, THREAD_PRIORITY_TIME_CRITICAL);

    // Zero-initialised so a failing QueryPerformanceCounter cannot leave
    // indeterminate values behind.
    UInt64 pcStart = 0;
    UInt64 pcEnd = 0;

    // Count number of processor cycles inside the specified interval.
    // The tick reads are bracketed by the performance-counter reads.
    QueryPerformanceCounter((LARGE_INTEGER*)&pcStart);
    const UInt32 startTicks = plProfileManager::GetTime();
    Sleep(kSamplePeriodMS);
    const UInt32 endTicks = plProfileManager::GetTime();
    QueryPerformanceCounter((LARGE_INTEGER*)&pcEnd);

    // Restore thread priority.
    SetThreadPriority(thread, priority);

    UInt64 pcFreq = 0;
    QueryPerformanceFrequency((LARGE_INTEGER*)&pcFreq);

    const UInt32 numTicks = endTicks - startTicks;
    const UInt64 pcDiff = pcEnd - pcStart;

    // Without a measurable interval or a frequency there is nothing to scale.
    if (pcDiff == 0 || pcFreq == 0)
        return 0;

    // Calculate Rdtsc/PerformanceCounter ratio, then the CPU frequency.
    const double ratio = double(numTicks) / double(pcDiff);
    const UInt64 cpuFreq = UInt64(pcFreq * ratio);

    if (cpuFreq > 0xFFFFFFFF)
        return 0xFFFFFFFF;      // saturate instead of truncating

    return (UInt32)cpuFreq;
}
|
||
|
|
||
|
#define GetProfileTicks() GetPentiumCounter()
|
||
|
|
||
|
#else
|
||
|
|
||
|
#define GetProfileTicks() hsTimer::GetPrecTickCount()
|
||
|
|
||
|
#endif // USE_FAST_TIMER
|
||
|
|
||
|
// Conversions between raw profile ticks and milliseconds, both evaluated in
// float and both based on the tick rate stored in gCyclesPerMS.
#define TicksToMSec(t) (static_cast<float>(t) / static_cast<float>(gCyclesPerMS))
#define MSecToTicks(t) (static_cast<float>(t) * static_cast<float>(gCyclesPerMS))
|
||
|
|
||
|
// Determines the tick rate used for all tick <-> millisecond conversions and
// stores it in gCyclesPerMS.
//
// With USE_FAST_TIMER the processor speed is taken from the registry and, if
// that yields 0, measured instead. Otherwise the rate reported by hsTimer is
// used.
plProfileManager::plProfileManager() : fLastAvgTime(0), fProcessorSpeed(0)
{
#ifdef USE_FAST_TIMER
    fProcessorSpeed = GetProcSpeed();
    // Registry stuff only works on NT OS's, have to calc it otherwise
    if (fProcessorSpeed == 0)
        fProcessorSpeed = GetProcSpeedAlt();

    gCyclesPerMS = fProcessorSpeed / 1000;
#else
    gCyclesPerMS = hsTimer::GetPrecTicksPerSec() / 1000;
#endif

    // TicksToMSec divides by gCyclesPerMS. A rate of 0 (detection failed, or
    // fewer than 1000 ticks per second) would turn every converted value into
    // a division by zero, so keep the divisor non-zero.
    if (gCyclesPerMS == 0)
        gCyclesPerMS = 1;
}
|
||
|
|
||
|
// Nothing to release here.
plProfileManager::~plProfileManager() {}
|
||
|
|
||
|
// Returns the single manager object, which is constructed on first use.
plProfileManager& plProfileManager::Instance()
{
    static plProfileManager sManager;
    return sManager;
}
|
||
|
|
||
|
// Appends 'var' to the list of variables visited by BeginFrame/EndFrame.
// Only the pointer is stored.
void plProfileManager::AddTimer(plProfileVar* var)
{
    fVars.insert(fVars.end(), var);
}
|
||
|
|
||
|
static UInt32 kAvgMilliseconds = 1000;
|
||
|
|
||
|
void plProfileManager::SetAvgTime(UInt32 avgMS)
|
||
|
{
|
||
|
kAvgMilliseconds = avgMS;
|
||
|
}
|
||
|
|
||
|
// Timer started at the end of plProfileManager::BeginFrame and stopped at the
// start of plProfileManager::EndFrame.
static plProfileVar gVarEFPS(
    "EFPS",
    "General",
    plProfileVar::kDisplayTime | plProfileVar::kDisplayFPS);
|
||
|
|
||
|
void plProfileManager::BeginFrame()
|
||
|
{
|
||
|
for (int i = 0; i < fVars.size(); i++)
|
||
|
{
|
||
|
fVars[i]->BeginFrame();
|
||
|
if (fVars[i]->GetLaps())
|
||
|
fVars[i]->GetLaps()->BeginFrame();
|
||
|
}
|
||
|
|
||
|
gVarEFPS.BeginTiming();
|
||
|
}
|
||
|
|
||
|
void plProfileManager::EndFrame()
|
||
|
{
|
||
|
gVarEFPS.EndTiming();
|
||
|
|
||
|
hsBool updateAvgs = false;
|
||
|
|
||
|
// If enough time has passed, update the averages
|
||
|
double curTime = hsTimer::GetMilliSeconds();
|
||
|
if (curTime - fLastAvgTime > kAvgMilliseconds)
|
||
|
{
|
||
|
fLastAvgTime = curTime;
|
||
|
updateAvgs = true;
|
||
|
}
|
||
|
|
||
|
int i;
|
||
|
|
||
|
//
|
||
|
// Update all the variables
|
||
|
//
|
||
|
for (i = 0; i < fVars.size(); i++)
|
||
|
{
|
||
|
plProfileVar* var = fVars[i];
|
||
|
|
||
|
if (updateAvgs)
|
||
|
{
|
||
|
// Timers that reset at every BeginTiming() call don't want to average over frames
|
||
|
if (!hsCheckBits(var->GetDisplayFlags(), plProfileBase::kDisplayResetEveryBegin))
|
||
|
{
|
||
|
var->UpdateAvg();
|
||
|
if (var->GetLaps())
|
||
|
var->GetLaps()->UpdateAvgs();
|
||
|
}
|
||
|
}
|
||
|
|
||
|
var->EndFrame();
|
||
|
|
||
|
if (var->GetLaps())
|
||
|
var->GetLaps()->EndFrame();
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Returns the current profile tick count as a UInt32, using whichever source
// GetProfileTicks() was configured with.
UInt32 plProfileManager::GetTime()
{
    const UInt32 now = GetProfileTicks();
    return now;
}
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////////////
|
||
|
|
||
|
// Starts with no name, no display flags and all counters and statistics
// cleared; the object is inactive but marked as running.
plProfileBase::plProfileBase()
    : fName(nil)
    , fDisplayFlags(0)
    , fValue(0)
    , fTimerSamples(0)
    , fAvgCount(0)
    , fAvgTotal(0)
    , fLastAvg(0)
    , fMax(0)
    , fActive(false)
    , fRunning(true)
{
}
|
||
|
|
||
|
// Nothing to release here.
plProfileBase::~plProfileBase() {}
|
||
|
|
||
|
void plProfileBase::BeginFrame()
|
||
|
{
|
||
|
if (!hsCheckBits(fDisplayFlags, kDisplayNoReset))
|
||
|
fValue = 0;
|
||
|
fTimerSamples = 0;
|
||
|
}
|
||
|
|
||
|
void plProfileBase::EndFrame()
|
||
|
{
|
||
|
fAvgCount++;
|
||
|
fAvgTotal += fValue;
|
||
|
fMax = hsMaximum(fMax, fValue);
|
||
|
}
|
||
|
|
||
|
void plProfileBase::UpdateAvg()
|
||
|
{
|
||
|
if (fAvgCount > 0)
|
||
|
{
|
||
|
fLastAvg = (UInt32)(fAvgTotal / fAvgCount);
|
||
|
fAvgCount = 0;
|
||
|
fAvgTotal = 0;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Returns the current value. When kDisplayTime is set the value is converted
// from ticks to milliseconds first; otherwise it is returned as stored.
UInt32 plProfileBase::GetValue()
{
    if (!hsCheckBits(fDisplayFlags, kDisplayTime))
        return fValue;

    return (UInt32)TicksToMSec(fValue);
}
|
||
|
|
||
|
// Stolen from plMemTracker.cpp
|
||
|
// Formats 'value' in decimal with a comma between each group of three digits
// (e.g. 1234567 -> "1,234,567").
//
// The result lives in a static buffer: it is overwritten by the next call and
// must be copied if it has to be kept.
static const char *insertCommas(unsigned int value)
{
    static char str[30];

    char digits[16];
    const int numDigits = sprintf(digits, "%u", value);

    memset(str, 0, sizeof(str));

    // Single left-to-right pass, independent of how many digits there are.
    char* out = str;
    for (int i = 0; i < numDigits; ++i)
    {
        // A comma goes in front of every digit that starts a complete group
        // of three counted from the right (never in front of the first digit).
        if (i > 0 && (numDigits - i) % 3 == 0)
            *out++ = ',';
        *out++ = digits[i];
    }

    return str;
}
|
||
|
|
||
|
// Writes a textual form of 'value' into 'buf' according to the display flags.
// The flags are tested in the order count, FPS, time, memory, and the first
// one that matches decides the format. 'printType' requests the decorated
// form where one exists (digit grouping for counts, " ms" for times, a size
// unit for memory). If none of those flags is set, 'buf' is left untouched.
//
// 'buf' must be large enough for the formatted text; no length is checked.
void plProfileBase::IPrintValue(UInt32 value, char* buf, hsBool printType)
{
    if (hsCheckBits(fDisplayFlags, kDisplayCount))
    {
        if (!printType)
            sprintf(buf, "%u", value);
        else
            strcpy(buf, insertCommas(value));
        return;
    }

    if (hsCheckBits(fDisplayFlags, kDisplayFPS))
    {
        // 'value' is a duration in ticks; show it as a rate per second.
        sprintf(buf, "%.1f", 1000.0f / TicksToMSec(value));
        return;
    }

    if (hsCheckBits(fDisplayFlags, kDisplayTime))
    {
        sprintf(buf, "%.1f", TicksToMSec(value));
        if (printType)
            strcat(buf, " ms");
        return;
    }

    if (!hsCheckBits(fDisplayFlags, kDisplayMem))
        return;

    if (!printType)
    {
        sprintf(buf, "%u", value);
        return;
    }

    // Pick the unit from the magnitude of the value.
    if (value > (1024*1000))
        sprintf(buf, "%.1f MB", float(value) / (1024.f * 1024.f));
    else if (value > 1024)
        sprintf(buf, "%d KB", value / 1024);
    else
        sprintf(buf, "%d b", value);
}
|
||
|
|
||
|
void plProfileBase::PrintValue(char* buf, hsBool printType)
|
||
|
{
|
||
|
IPrintValue(fValue, buf, printType);
|
||
|
}
|
||
|
|
||
|
void plProfileBase::PrintAvg(char* buf, hsBool printType)
|
||
|
{
|
||
|
IPrintValue(fLastAvg, buf, printType);
|
||
|
}
|
||
|
|
||
|
void plProfileBase::PrintMax(char* buf, hsBool printType)
|
||
|
{
|
||
|
IPrintValue(fMax, buf, printType);
|
||
|
}
|
||
|
|
||
|
////////////////////////////////////////////////////////////////////////////////
|
||
|
|
||
|
|
||
|
// Looks up the lap whose GetName() compares equal (operator==) to 'lapName'.
// Returns nil when there is none.
//
// The search starts at the index of the previous hit and wraps around to the
// beginning. That index is a function-level static, so it is shared by every
// plProfileLaps object.
plProfileLaps::LapInfo* plProfileLaps::IFindLap(const char* lapName)
{
    static int lastSearch = 0;

    // First pass: from the previous hit to the end of the list.
    int idx = lastSearch;
    while (idx < fLapTimes.size())
    {
        if (fLapTimes[idx].GetName() == lapName)
        {
            lastSearch = idx;
            return &fLapTimes[idx];
        }
        ++idx;
    }

    // The remembered index may lie beyond this list; pull it back in range
    // before using it as the end of the second pass.
    if (lastSearch > fLapTimes.size())
        lastSearch = fLapTimes.size();

    // Second pass: the entries in front of the previous hit.
    idx = 0;
    while (idx < lastSearch)
    {
        if (fLapTimes[idx].GetName() == lapName)
        {
            lastSearch = idx;
            return &fLapTimes[idx];
        }
        ++idx;
    }

    return nil;
}
|
||
|
|
||
|
// Starts timing the lap called 'name', creating its entry on first use, and
// marks the lap as used during the current frame.
void plProfileLaps::BeginLap(UInt32 curValue, const char* name)
{
    LapInfo* lap = IFindLap(name);
    if (!lap)
    {
        // Technically we shouldn't hold on to a pointer into the vector.
        // It is only used until the end of this function, though.
        fLapTimes.push_back(LapInfo(name));
        lap = &fLapTimes.back();
    }

    lap->fUsedThisFrame = true;
    lap->BeginTiming(curValue);
}
|
||
|
|
||
|
// Stops timing the lap called 'name'. A lap that was never begun is ignored.
void plProfileLaps::EndLap(UInt32 curValue, const char* name)
{
    // There's a lap timer around the input code. You display it with
    // "Stats.ShowLaps Update Input". Since the command activates the timer
    // INSIDE the lap, the first call to this function fails to find it
    // (the timer wasn't active when BeginLap was called).
    LapInfo* lap = IFindLap(name);
    if (!lap)
        return;

    lap->EndTiming(curValue);
}
|
||
|
|
||
|
void plProfileLaps::BeginFrame()
|
||
|
{
|
||
|
for (int i = 0; i < fLapTimes.size(); i++)
|
||
|
{
|
||
|
fLapTimes[i].BeginFrame();
|
||
|
fLapTimes[i].fUsedThisFrame = false;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void plProfileLaps::EndFrame()
|
||
|
{
|
||
|
for (int i = 0; i < fLapTimes.size(); i++)
|
||
|
{
|
||
|
fLapTimes[i].EndFrame();
|
||
|
if (!fLapTimes[i].fUsedThisFrame)
|
||
|
{
|
||
|
char buf[200];
|
||
|
sprintf(buf, "Dropping unused lap %s", fLapTimes[i].GetName());
|
||
|
hsStatusMessage(buf);
|
||
|
fLapTimes.erase(fLapTimes.begin()+i);
|
||
|
i--;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void plProfileLaps::UpdateAvgs()
|
||
|
{
|
||
|
for (int i = 0; i < fLapTimes.size(); i++)
|
||
|
fLapTimes[i].UpdateAvg();
|
||
|
}
|
||
|
|
||
|
int plProfileLaps::GetNumLaps()
|
||
|
{
|
||
|
// std::sort(fLapTimes.begin(), fLapTimes.end());
|
||
|
return fLapTimes.size();
|
||
|
}
|
||
|
|
||
|
// Returns the lap stored at index 'i'. The index is not range-checked.
plProfileBase* plProfileLaps::GetLap(int i)
{
    LapInfo& lap = fLapTimes[i];
    return &lap;
}
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////////////
|
||
|
|
||
|
|
||
|
// Creates a variable with the given name, group and display flags and
// registers it with the profile manager. Lap tracking starts out switched
// off, with no lap collection allocated.
plProfileVar::plProfileVar(const char *name, const char* group, UInt8 flags)
    : fGroup(group)
    , fLaps(nil)
{
    fName = name;
    fDisplayFlags = flags;
    fLapsActive = 0;

    plProfileManager::Instance().AddTimer(this);
}
|
||
|
|
||
|
// Frees the lap collection, if one was ever allocated.
plProfileVar::~plProfileVar()
{
    delete fLaps;   // deleting nil is harmless
}
|
||
|
|
||
|
void plProfileVar::IBeginLap(const char* lapName)
|
||
|
{
|
||
|
if (!fLaps)
|
||
|
fLaps = TRACKED_NEW plProfileLaps;
|
||
|
fDisplayFlags |= kDisplayLaps;
|
||
|
if(fLapsActive)
|
||
|
fLaps->BeginLap(fValue, lapName);
|
||
|
BeginTiming();
|
||
|
}
|
||
|
|
||
|
void plProfileVar::IEndLap(const char* lapName)
|
||
|
{
|
||
|
EndTiming();
|
||
|
if(fLapsActive)
|
||
|
fLaps->EndLap(fValue, lapName);
|
||
|
}
|
||
|
|
||
|
void plProfileVar::IBeginTiming()
|
||
|
{
|
||
|
if( hsCheckBits( fDisplayFlags, kDisplayResetEveryBegin ) )
|
||
|
fValue = 0;
|
||
|
|
||
|
fValue -= GetProfileTicks();
|
||
|
}
|
||
|
|
||
|
void plProfileVar::IEndTiming()
|
||
|
{
|
||
|
fValue += GetProfileTicks();
|
||
|
|
||
|
fTimerSamples++;
|
||
|
|
||
|
// If we reset every BeginTiming(), then we want to average all the timing calls
|
||
|
// independent of framerate
|
||
|
if (hsCheckBits(fDisplayFlags, plProfileBase::kDisplayResetEveryBegin))
|
||
|
UpdateAvg();
|
||
|
}
|