|
|
//========= Copyright Valve Corporation, All rights reserved. ============//
//
// Purpose:
//
// $NoKeywords: $
//=============================================================================
#include "stdafx.h"
// memdbgon must be the last include file in a .cpp file!!!
#include "tier0/memdbgon.h"
// Everything that follows in this file is defined inside the GCSDK namespace.
namespace GCSDK { #ifdef DEBUG_JOB_LIST
// Debug-only (DEBUG_JOB_LIST) static list of jobs: InsertJob() appends to it
// and RemoveJob() removes from it.
CUtlLinkedList<CJob *,int> CJobMgr::sm_listAllJobs; #endif
// Comparison callback type that receives a context pointer ahead of the two
// elements; DumpSQLProfile() casts SQLProfileSortFunc to this for V_qsort_s.
typedef int (__cdecl *QSortCompareFuncCtx_t)(void *, const void *, const void *);
//-----------------------------------------------------------------------------
// Purpose: Constructor
//-----------------------------------------------------------------------------
CJobMgr::CJobMgr()
    : m_MapJob( 0, 0, DefLessFunc( GID_t ) ),
      m_QueueJobSleeping( 0, 0, &JobSleepingLessFunc ),
      m_unNextJobID( 0 ),
      m_mapStatsBucket( 0, 0, DefLessFunc(uint32) ),
      m_WorkThreadPool( "CJobMgr::m_WorkThreadPool" ),
      m_bDebugDisallowPause( false )
{
    // These two maps are not configured in the initializer list, so install
    // their default less-than functions here.
    SetDefLessFunc( m_mapOrphanMessages );
    SetDefLessFunc( m_MapJobTimeoutsIndexByJobID );

    // Plain state flags and counters all start cleared.
    m_unFrameFuncThreadID = 0;
    m_cErrorsToReport = 0;
    m_bIsShuttingDown = false;
    m_bProfiling = false;
    m_nCurrentYieldIterationRegPri = 0;
    m_bJobTimedOut = false;

    // Start the pool with an auto-construct count of one work thread;
    // SetThreadPoolSize() can change it later.
    m_WorkThreadPool.SetWorkThreadAutoConstruct( 1, NULL );

    // Only set up the main debug-info buffer when the allocator reports a
    // non-zero debug info size.
    if ( MemAlloc_GetDebugInfoSize() > 0 )
    {
        g_memMainDebugInfo.Init( 0, MemAlloc_GetDebugInfoSize() );
    }

    // NOTE(review): this repeats the check above and asks for the same
    // capacity Init() was just given -- looks redundant, confirm before removing.
    if ( MemAlloc_GetDebugInfoSize() > 0 )
    {
        g_memMainDebugInfo.EnsureCapacity( MemAlloc_GetDebugInfoSize() );
    }
}
//-----------------------------------------------------------------------------
// Purpose: Destructor
//-----------------------------------------------------------------------------
CJobMgr::~CJobMgr()
{
    // Stop the pool's work threads as part of tearing the manager down.
    m_WorkThreadPool.StopWorkThreads();
}
//-----------------------------------------------------------------------------
// Purpose: limit the size of our thread pool
//-----------------------------------------------------------------------------
void CJobMgr::SetThreadPoolSize( uint cThreads )
{
    // Forward the requested thread count to the work thread pool
    // (same call the constructor makes with a count of 1).
    m_WorkThreadPool.SetWorkThreadAutoConstruct( cThreads, NULL );
}
//-----------------------------------------------------------------------------
// Purpose: gets the next available job ID
//-----------------------------------------------------------------------------
JobID_t CJobMgr::GetNewJobID()
{
#ifdef GC
    // GC builds ask the GC host to generate the ID.
    const JobID_t jobIDNew = GGCHost()->GenerateGID();
#else
    // Other builds hand out IDs from a local counter; it is pre-incremented,
    // so the value returned is the counter after the bump.
    const JobID_t jobIDNew = ++m_unNextJobID;
#endif
    return jobIDNew;
}
//-----------------------------------------------------------------------------
// Purpose: Run jobs
// Runs once per frame and resumes any sleeping jobs that are scheduled
// to run again, also checks for jobs which have timed out.
//
// Input: limitTimer - limit timer not to exceed
// Output: true if there is still work remaining to do, false otherwise
//-----------------------------------------------------------------------------
bool CJobMgr::BFrameFuncRunSleepingJobs( CLimitTimer &limitTimer )
{
    // make sure frame function is called from correct thread
    CheckThreadID();

    // Wake sleepers whose time has come; the result is what we report back.
    bool bSleepersRemain = false;
    {
        VPROF_BUDGET( "CJobMgr::BResumeSleepingJobs", VPROF_BUDGETGROUP_JOBS_COROUTINES );
        bSleepersRemain = BResumeSleepingJobs( limitTimer );
    }

    // Timeout checking does not contribute to the "work remaining" result.
    {
        VPROF_BUDGET( "CJobMgr::CheckForJobTimeouts", VPROF_BUDGETGROUP_JOBS_COROUTINES );
        CheckForJobTimeouts( limitTimer );
    }

    // Refresh the current-job count in the stats block.
    m_JobStats.m_cJobsCurrent = CountJobs();

    return bSleepersRemain;
}
//-----------------------------------------------------------------------------
// Purpose: Run jobs
// This function is called repeatedly in a single frame if time is left
// and will first run any yielding jobs
// Input: limitTimer - limit timer not to exceed
// Output: true if there is still work remaining to do, false otherwise
//-----------------------------------------------------------------------------
bool CJobMgr::BFrameFuncRunYieldingJobs( CLimitTimer &limitTimer )
{
    // make sure frame function is called from correct thread
    CheckThreadID();

    // Step 1: resume jobs sitting on the yield list.
    bool bMoreToDo = false;
    {
        VPROF_BUDGET( "CJobMgr::BResumeYieldingJobs", VPROF_BUDGETGROUP_JOBS_COROUTINES );
        bMoreToDo = BResumeYieldingJobs( limitTimer );
    }

    // Step 2: dispatch work items the thread pool has finished. This always
    // runs, regardless of the result of step 1.
    {
        VPROF_BUDGET( "CJobMgr -- Dispatch completed work items", VPROF_BUDGETGROUP_JOBS_COROUTINES );
        if ( m_WorkThreadPool.BDispatchCompletedWorkItems( limitTimer, this ) )
        {
            bMoreToDo = true;
        }
    }

    // Refresh the current-job count in the stats block.
    m_JobStats.m_cJobsCurrent = CountJobs();

    return bMoreToDo;
}
//-----------------------------------------------------------------------------
// Purpose: Registers a new job for us to keep track of.
// Input: job - The job in question
//-----------------------------------------------------------------------------
void CJobMgr::InsertJob( CJob &job )
{
    const JobID_t jobID = job.GetJobID();

    // A job ID must not already be present in the map.
    Assert( m_MapJob.InvalidIndex() == m_MapJob.Find( jobID ) );

    // The map stores a pointer only; the manager does not take a copy of the job.
    m_MapJob.Insert( jobID, &job );

#ifdef DEBUG_JOB_LIST
    // Mirror the registration in the debug-only list of all jobs.
    sm_listAllJobs.AddToTail( &job );
#endif
}
//-----------------------------------------------------------------------------
// purpose: This job is done, accumulate its stats
//-----------------------------------------------------------------------------
void CJobMgr::AccumulateStatsofJob( CJob &job )
{
    // if we are not profiling, but the job experienced some kind of failure
    // record it anyway - we will issue a consolidated spew about it
    if ( !m_bProfiling && job.m_flags.m_uFlags == 0 )
        return;

    // Any flag bit set counts as one more error to report.
    if ( job.m_flags.m_uFlags )
        m_cErrorsToReport++;

    // Close out the job's running timer and fold it into its cycle total.
    job.m_FastTimerDelta.End();
    job.m_cyclecountTotal += job.m_FastTimerDelta.GetDuration();

    // the pointer to the name is a pointer to a constant string
    // so use this dirty trick to make lookups fast.
    // The pointer is converted through size_t first: casting a pointer straight
    // to a 32-bit integer is ill-formed on compilers where pointers are 64-bit.
    // NOTE(review): the map key is uint32, so with 64-bit pointers only the low
    // 32 bits are kept and two different names could share a bucket.
    const uint32 eBucket = static_cast<uint32>( reinterpret_cast<size_t>( job.GetName() ) );

    // Find the bucket for this job name, creating and naming it on first use.
    int iBucket = m_mapStatsBucket.Find( eBucket );
    if ( iBucket == m_mapStatsBucket.InvalidIndex() )
    {
        iBucket = m_mapStatsBucket.Insert( eBucket );
        V_strcpy_safe( m_mapStatsBucket[iBucket].m_rgchName, job.GetName() );
    }

    // Counters: one completion, lock statistics, and one count per failure flag set.
    JobStatsBucket_t *pJobStatsBucket = &m_mapStatsBucket[iBucket];
    pJobStatsBucket->m_cCompletes++;
    pJobStatsBucket->m_cLocksAttempted += job.m_cLocksAttempted;
    pJobStatsBucket->m_cLocksWaitedFor += job.m_cLocksWaitedFor;
    pJobStatsBucket->m_cLocksFailed += job.m_flags.m_bits.m_bLocksFailed ? 1 : 0;
    pJobStatsBucket->m_cLocksLongHeld += job.m_flags.m_bits.m_bLocksLongHeld ? 1 : 0;
    pJobStatsBucket->m_cLocksLongWait += job.m_flags.m_bits.m_bLocksLongWait ? 1 : 0;
    pJobStatsBucket->m_cWaitTimeout += job.m_flags.m_bits.m_bWaitTimeout ? 1 : 0;
    pJobStatsBucket->m_cJobsFailed += job.m_flags.m_bits.m_bJobFailed ? 1 : 0;
    pJobStatsBucket->m_cLongInterYieldTime += job.m_flags.m_bits.m_bLongInterYield ? 1 : 0;
    pJobStatsBucket->m_cTimeoutNetMsg += job.m_flags.m_bits.m_bTimeoutNetMsg ? 1 : 0;

    // Run time in cycles: running sum plus the largest single job seen.
    pJobStatsBucket->m_u64RunTime += job.m_cyclecountTotal.GetLongCycles();
    if ( (uint64)job.m_cyclecountTotal.GetLongCycles() > pJobStatsBucket->m_u64RunTimeMax )
        pJobStatsBucket->m_u64RunTimeMax = job.m_cyclecountTotal.GetLongCycles();

    // A switch time that differs from the start time is counted as a paused
    // job, and its duration is measured from the start time. Otherwise the
    // duration comes from the accumulated cycle count.
    if ( job.m_STimeSwitched != job.m_STimeStarted )
    {
        pJobStatsBucket->m_cJobsPaused++;
        pJobStatsBucket->m_u64JobDuration += job.m_STimeStarted.CServerMicroSecsPassed();
    }
    else
    {
        pJobStatsBucket->m_u64JobDuration += job.m_cyclecountTotal.GetMicroseconds();
    }
}
//-----------------------------------------------------------------------------
// purpose: This message was orphaned, accumulate for stats
//-----------------------------------------------------------------------------
void CJobMgr::RecordOrphanedMessage( MsgType_t eMsg, JobID_t jobIDTarget )
{
    EG_MSG( SPEW_JOB, "Message %s arrived responding to job %lld which no longer exists, dropping message\n", PchMsgNameFromEMsg( eMsg ), jobIDTarget );

    // Orphans are tallied per message type; create the tally at zero on first sight.
    int iOrphan = m_mapOrphanMessages.Find( eMsg );
    if ( m_mapOrphanMessages.InvalidIndex() == iOrphan )
    {
        int cInitial = 0;
        iOrphan = m_mapOrphanMessages.Insert( eMsg, cInitial );
    }

    m_mapOrphanMessages[iOrphan]++;
}
//-----------------------------------------------------------------------------
// Purpose: Removes a job from the manager. Note that we don't free it.
// Input: job - The job in question
//-----------------------------------------------------------------------------
void CJobMgr::RemoveJob( CJob &job )
{
    // Unregister first; the job object itself is not freed here.
    m_MapJob.Remove( job.GetJobID() );

    // Per-job-name statistics.
    AccumulateStatsofJob( job );

    // Manager-wide totals.
    m_JobStats.m_cJobsTotal++;
    if ( job.m_flags.m_bits.m_bJobFailed )
    {
        m_JobStats.m_cJobsFailed++;
    }

    // Time since the job started feeds the sum, sum of squares and maximum.
    const uint64 cMicrosecElapsed = job.m_STimeStarted.CServerMicroSecsPassed();
    m_JobStats.m_flSumJobTimeMicrosec += cMicrosecElapsed;
    m_JobStats.m_flSumSqJobTimeMicrosec += ( (double)cMicrosecElapsed * (double)cMicrosecElapsed );
    if ( cMicrosecElapsed > m_JobStats.m_unMaxJobTimeMicrosec )
    {
        m_JobStats.m_unMaxJobTimeMicrosec = cMicrosecElapsed;
    }

#ifdef DEBUG_JOB_LIST
    // Keep the debug-only list of all jobs in step with the map.
    sm_listAllJobs.FindAndRemove( &job );
#endif
}
#ifdef GC
//-----------------------------------------------------------------------------
// Purpose: Called when a SQL query for the given job has returned. Closes out
//          any profiling record for the query and, if the job is paused for
//          SQL, ends the pause and queues the job on the yield list.
// Output:  true if the job was found paused for SQL and queued, false otherwise
//-----------------------------------------------------------------------------
bool CJobMgr::BResumeSQLJob( JobID_t jobID )
{
    // If this query was being tracked, fold its elapsed time into its bucket
    // (only while profiling is on) and drop the tracking entry.
    const int iInFlight = m_mapSQLQueriesInFlight.Find( jobID );
    if ( m_mapSQLQueriesInFlight.IsValidIndex( iInFlight ) )
    {
        const PendingSQLJob_t &pending = m_mapSQLQueriesInFlight[iInFlight];
        if ( m_bSQLProfiling && m_dictSQLBuckets.IsValidIndex( pending.m_iBucket ) )
        {
            SQLProfileBucket_t &bucket = m_dictSQLBuckets[ pending.m_iBucket ];
            bucket.m_unCount++;
            bucket.m_nTotalMicrosec += (int64)m_sqlTimer.GetDurationInProgress().GetUlMicroseconds() - pending.m_nStartMicrosec;
        }

        m_mapSQLQueriesInFlight.RemoveAt( iInFlight );
    }

    // The job must exist and be paused specifically for SQL.
    int iJob;
    const bool bFound = BGetIJob( jobID, k_EJobPauseReasonSQL, true, &iJob );
    if ( !bFound )
    {
        EG_MSG( SPEW_JOB, "BResumeSQLJob called for a job that could not be found!\n" );
        return false;
    }

    // Just change the job's pause reason and add it to the yield list
    // it will wake up on the next heartbeat
    CJob *pJob = m_MapJob[iJob];
    pJob->EndPause( k_EJobPauseReasonSQL );
    AddToYieldList( *pJob );

    return true;
}
#endif
//-----------------------------------------------------------------------------
// Purpose: returns true if we're running any jobs of the specified name
// Output : Returns true on success, false on failure.
//-----------------------------------------------------------------------------
bool CJobMgr::BIsJobRunning( const char *pchJobName ) { FOR_EACH_MAP_FAST( m_MapJob, i ) { if ( !Q_stricmp( m_MapJob[i]->GetName(), pchJobName ) ) return true; } return false; }
//-----------------------------------------------------------------------------
// Purpose: returns true if there is a job active with the specified ID
//-----------------------------------------------------------------------------
bool CJobMgr::BJobExists( JobID_t jobID ) const
{
    // A job exists exactly when its ID has an entry in the job map.
    const int iJob = m_MapJob.Find( jobID );
    return ( m_MapJob.InvalidIndex() != iJob );
}
//-----------------------------------------------------------------------------
// Purpose: returns a job pointer by id
//-----------------------------------------------------------------------------
const CJob *CJobMgr::GetPJob( JobID_t jobID ) const
{
    // Const lookup: NULL when the ID is not registered.
    const int iJob = m_MapJob.Find( jobID );
    if ( m_MapJob.InvalidIndex() == iJob )
    {
        return NULL;
    }

    return m_MapJob[iJob];
}
CJob *CJobMgr::GetPJob( JobID_t jobID )
{
    // Mutable lookup: NULL when the ID is not registered.
    const int iJob = m_MapJob.Find( jobID );
    if ( m_MapJob.InvalidIndex() == iJob )
    {
        return NULL;
    }

    return m_MapJob[iJob];
}
//-----------------------------------------------------------------------------
// Purpose: Examines an incoming message to see if it belongs to an active job,
// and if so, sends it to that job. Creates a new job if necessary.
// Output: true if the message was routed to a job
//-----------------------------------------------------------------------------
bool CJobMgr::BRouteMsgToJob( void *pParent, IMsgNetPacket *pNetPacket, const JobMsgInfo_t &jobMsgInfo )
{
    // Nothing can be routed without a packet.
    if ( NULL == pNetPacket )
    {
        AssertMsg(pNetPacket, "CJobMgr::BRouteMsgToJob received NULL packet.");
        return false;
    }

    // A non-nil target means this message is a reply to a running job.
    if ( k_GIDNil != jobMsgInfo.m_JobIDTarget )
    {
        VPROF_BUDGET( "CJobMgr::BRouteMsgToJob() - continue job", VPROF_BUDGETGROUP_JOBS_COROUTINES );

        // Find the job that this packet is destined for
        const int iTargetJob = m_MapJob.Find( jobMsgInfo.m_JobIDTarget );
        if ( iTargetJob != m_MapJob.InvalidIndex() )
        {
            // found the right job, pass it off
            PassMsgToJob( *(m_MapJob[iTargetJob]), pNetPacket, jobMsgInfo );
            return true;
        }

        // The job is no longer running, it most likely timed out before the response arrived.
        // Continue and see if a job is registered to launch from this message
    }

    // no job, so try creating a job that can handle the msg
    // We pass in a pointer to m_JobIDTarget so that it gets set to the new Job's ID. This ensures
    // that anyone replying to this message from within the new job has the right JobIDSource.
    VPROF_BUDGET( "CJobMgr::BRouteMsgToJob() - job", VPROF_BUDGETGROUP_JOBS_COROUTINES );
    const bool bLaunched = BLaunchJobFromNetworkMsg( pParent, jobMsgInfo, pNetPacket );
    if ( bLaunched )
    {
        return true;
    }

    // Nothing launched. The target is re-read here, after the launch attempt.
    if ( k_GIDNil == jobMsgInfo.m_JobIDTarget )
    {
        return false;
    }

    // return that we've handled this message (as much as it possibly can be) -- was intended for a job that has
    // timed out, no one else can do anything with it
    RecordOrphanedMessage( jobMsgInfo.m_eMsg, jobMsgInfo.m_JobIDTarget );
    return true;
}
//-----------------------------------------------------------------------------
// Purpose: Routes a message directly to the specified job
//-----------------------------------------------------------------------------
void CJobMgr::PassMsgToJob( CJob &job, IMsgNetPacket *pNetPacket, const JobMsgInfo_t &jobMsgInfo )
{
    // Check if this job previously failed to wait for this message type,
    // then this is probably a late reply. Discard it
    const bool bLateReply = job.BHasFailedToReceivedMsgType( jobMsgInfo.m_eMsg );
    if ( bLateReply )
    {
        EmitInfo( SPEW_JOB, 2, LOG_ALWAYS, "Reply msg type %s to job %s is too late; discarding\n", PchMsgNameFromEMsg( jobMsgInfo.m_eMsg ), job.GetName() );
        return;
    }

    // make sure it's what we're waiting for; if the job is paused for any
    // other reason, complain and throw this message away
    if ( k_EJobPauseReasonNetworkMsg != job.GetPauseReason() )
    {
        AssertMsg3( false, "CJobMgr::PassMsgToJob() job %s received unexpected message %s when paused for %s\n", job.GetName(), PchMsgNameFromEMsg( jobMsgInfo.m_eMsg ), job.GetPauseReasonDescription() );
        return;
    }

    // Add the packet and resume the job: the pause is ended here and the job
    // is queued on the yield list.
    job.AddPacketToList( pNetPacket, jobMsgInfo.m_JobIDSource );
    job.EndPause( k_EJobPauseReasonNetworkMsg );
    AddToYieldList( job );
}
//-----------------------------------------------------------------------------
// Purpose: pauses the job until a network msg for the specified job arrives
//-----------------------------------------------------------------------------
bool CJobMgr::BYieldingWaitForMsg( CJob &job )
{
    // wait until we're woken up by a networking callback, or a timeout
    PauseJob( job, k_EJobPauseReasonNetworkMsg );

    // Once the pause returns, m_bJobTimedOut decides success or failure.
    if ( m_bJobTimedOut )
    {
        return false;
    }
    return true;
}
//-----------------------------------------------------------------------------
// Purpose: Returns IJob matching a JobID, if it is paused for the given reason
// Input: jobID - The job that should be paused for the given reason
// eJobPauseReason - Pause reason
// bShouldExist - If true, job should exist, so asserts on not finding it ok
// pIJob - IJob to fill in
// Output: true if job paused for matching reason found
//-----------------------------------------------------------------------------
bool CJobMgr::BGetIJob( JobID_t jobID, EJobPauseReason eJobPauseReason, bool bShouldExist, int *pIJob )
{
    // If this isn't owned by a job, we don't handle it
    if ( jobID == k_GIDNil )
    {
        return false;
    }

    // Figure out which job the msg belongs to
    const int iFound = m_MapJob.Find( jobID );
    const bool bKnownJob = ( iFound != m_MapJob.InvalidIndex() );
    Assert( bKnownJob || !bShouldExist );

    // If it's not one of ours, ignore it
    if ( !bKnownJob )
    {
        return false;
    }

    // make sure it's what we're waiting for
    if ( eJobPauseReason != m_MapJob[iFound]->GetPauseReason() )
    {
        return false;
    }

    // *pIJob is only written on success.
    *pIJob = iFound;
    return true;
}
//-----------------------------------------------------------------------------
// Purpose: yields for a set amount of time
// Input : &job - job that is yielding
//			cMicrosecondsToSleep - number of microseconds to wait for before resuming job
// Output : Returns true on success, false on failure.
//-----------------------------------------------------------------------------
bool CJobMgr::BYieldingWaitTime( CJob &job, uint32 cMicrosecondsToSleep )
{
    // The sleep must be shorter than the paused-job timeout.
    Assert( cMicrosecondsToSleep < k_cMicroSecJobPausedTimeout );
    // sleep of zero causes an infinite loop
    Assert( 0 != cMicrosecondsToSleep );

#ifdef _DEBUG
    // Debug builds verify this job is not already in the sleep queue.
    for ( int iSleeper = 0; iSleeper < m_QueueJobSleeping.Count(); iSleeper++ )
    {
        Assert( m_QueueJobSleeping.Element(iSleeper).m_JobID != job.GetJobID() );
    }
#endif

    // insert the job into the sleep list
    JobSleeping_t sleepEntry;
    sleepEntry.m_JobID = job.GetJobID();
    sleepEntry.m_SWakeupTime.SetFromJobTime( cMicrosecondsToSleep );
    sleepEntry.m_STimeTouched.SetToJobTime();
    m_QueueJobSleeping.Insert( sleepEntry );

    // yield; when control comes back, m_bJobTimedOut decides the result
    PauseJob( job, k_EJobPauseReasonSleepForTime );
    return m_bJobTimedOut ? false : true;
}
#ifdef GC
//-----------------------------------------------------------------------------
// Purpose: yields waiting for a query response
// Input : &job - job that is yielding
// Output : Returns true on success, false on failure.
//-----------------------------------------------------------------------------
// yields waiting for a query response
bool CJobMgr::BYieldingRunQuery( CJob &job, CGCSQLQueryGroup *pQueryGroup, ESchemaCatalog eSchemaCatalog )
{
    // clear the existing results pointer, if any, to make space for the results
    // for this query
    pQueryGroup->SetResults( NULL );

    if ( m_bSQLProfiling )
    {
        // Pick the profiling bucket name: the group's own name, else the text
        // of its only statement, else the job's name.
        const char *pchBucketName = pQueryGroup->PchName();
        if ( NULL == pchBucketName || '\0' == pchBucketName[0] )
        {
            if ( 1 == pQueryGroup->GetStatementCount() )
            {
                pchBucketName = pQueryGroup->PchCommand( 0 );
            }

            if ( NULL == pchBucketName || '\0' == pchBucketName[0] )
            {
                pchBucketName = job.GetName();
            }
        }

        // Record the start time and bucket so BResumeSQLJob() can total it up.
        PendingSQLJob_t pendingQuery;
        pendingQuery.m_nStartMicrosec = (int64)m_sqlTimer.GetDurationInProgress().GetUlMicroseconds();
        pendingQuery.m_iBucket = m_dictSQLBuckets.Find( pchBucketName );
        if ( !m_dictSQLBuckets.IsValidIndex( pendingQuery.m_iBucket ) )
        {
            SQLProfileBucket_t bucketEmpty = { 0, 0 };
            pendingQuery.m_iBucket = m_dictSQLBuckets.Insert( pchBucketName, bucketEmpty );
        }
        m_mapSQLQueriesInFlight.Insert( job.GetJobID(), pendingQuery );
    }

    VPROF_BUDGET( "GCHost", VPROF_BUDGETGROUP_STEAM );
    {
        VPROF_BUDGET( "GCHost - SQLQuery", VPROF_BUDGETGROUP_STEAM );
        GGCHost()->SQLQuery( job.GetJobID(), pQueryGroup, eSchemaCatalog );
    }

    // Pause for SQL; BResumeSQLJob() is what ends this pause.
    PauseJob( job, k_EJobPauseReasonSQL );

    // Success requires a results object that reports no error.
    if ( !pQueryGroup->GetResults() )
    {
        return false;
    }
    return pQueryGroup->GetResults()->GetError() == k_EGCSQLErrorNone;
}
//-----------------------------------------------------------------------------
// Purpose: turns on sql profiling
//-----------------------------------------------------------------------------
void CJobMgr::StartSQLProfiling()
{
    // Starting while already profiling is a no-op.
    if ( !m_bSQLProfiling )
    {
        // Begin from a clean slate: no tracked queries, no buckets.
        m_mapSQLQueriesInFlight.RemoveAll();
        m_dictSQLBuckets.RemoveAll();
        m_sqlTimer.Start();
        m_bSQLProfiling = true;
    }
}
//-----------------------------------------------------------------------------
// Purpose: turns off sql profiling
//-----------------------------------------------------------------------------
void CJobMgr::StopSQLProfiling()
{
    // Stopping while not profiling is a no-op.
    if ( m_bSQLProfiling )
    {
        // Forget queries still in flight; the buckets are left alone so
        // DumpSQLProfile() can still report them.
        m_mapSQLQueriesInFlight.RemoveAll();
        m_sqlTimer.End();
        m_bSQLProfiling = false;
    }
}
//-----------------------------------------------------------------------------
// Purpose: sql profile sort func
//-----------------------------------------------------------------------------
int CJobMgr::SQLProfileSortFunc( void *pCtx, const int *lhs, const int *rhs ) { SQLProfileCtx_t *pSQLProfileCtx = (SQLProfileCtx_t *)pCtx; CUtlDict<SQLProfileBucket_t> *pDictBuckets = pSQLProfileCtx->pdictBuckets; SQLProfileBucket_t &lhsBucket = pDictBuckets->Element( *lhs ); SQLProfileBucket_t &rhsBucket = pDictBuckets->Element( *rhs );
switch ( pSQLProfileCtx->m_eSort ) { default: case k_ESQLProfileSortTotalTime: return rhsBucket.m_nTotalMicrosec - lhsBucket.m_nTotalMicrosec; case k_ESQLProfileSortTotalCount: return rhsBucket.m_unCount - lhsBucket.m_unCount; case k_ESQLProfileSortAvgTime: return ( rhsBucket.m_nTotalMicrosec / rhsBucket.m_unCount ) - ( lhsBucket.m_nTotalMicrosec / lhsBucket.m_unCount ); case k_ESQLProfileSortName: return Q_stricmp( pDictBuckets->GetElementName( *lhs ), pDictBuckets->GetElementName( *rhs ) ); } }
//-----------------------------------------------------------------------------
// Purpose: dumps the current sql profile
//-----------------------------------------------------------------------------
void CJobMgr::DumpSQLProfile( ESQLProfileSort eSort ) { CUtlVector<int> vecSort; for ( int iDict = 0; iDict < m_dictSQLBuckets.MaxElement(); iDict++ ) { if ( !m_dictSQLBuckets.IsValidIndex( iDict ) ) continue;
if ( m_dictSQLBuckets[iDict].m_unCount > 0 ) { vecSort.AddToTail( iDict ); } }
EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "SQL statement stats:\n" ); if ( 0 == vecSort.Count() ) { EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "\tNo SQL stats collected; use sql_profile_on / sql_profile_off to collect stats first\n" ); return; }
// sort
SQLProfileCtx_t ctx; ctx.m_eSort = eSort; ctx.pdictBuckets = &m_dictSQLBuckets;
V_qsort_s( vecSort.Base(), vecSort.Count(), sizeof(int), (QSortCompareFuncCtx_t)SQLProfileSortFunc, &ctx );
// display
EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%8s %8s %8s\n", "count", "time", "avg" ); FOR_EACH_VEC( vecSort, i ) { SQLProfileBucket_t &bucket = m_dictSQLBuckets[ vecSort[i] ]; const char *pchStatement = m_dictSQLBuckets.GetElementName( vecSort[i] );
// cleanup the statement text
char rgchCleaned[140]; V_strcpy_safe( rgchCleaned, pchStatement ); for ( int i = 0; NULL != rgchCleaned[i]; i++ ) { if ( '\n' == rgchCleaned[i] || '\t' == rgchCleaned[i] ) { rgchCleaned[i] = ' '; } }
bool bSeconds = bucket.m_nTotalMicrosec > k_nMillion; float fTime = bucket.m_nTotalMicrosec / 1000.0f / ( bSeconds ? 1000.0f : 1.0f );
// render
EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%8d %8.2f%s %8.2f %s\n", bucket.m_unCount, fTime, bSeconds ? "s " : "ms", (float)bucket.m_nTotalMicrosec / (float)bucket.m_unCount / 1000.0f, rgchCleaned ); } } #endif
//-----------------------------------------------------------------------------
// Purpose: pauses job until a work item completes
//-----------------------------------------------------------------------------
bool CJobMgr::BYieldingWaitForWorkItem( CJob &job, const char *pszWorkItemName )
{
    // pszWorkItemName is not used by this function.

    // wait until we're woken up by a work item completed, or a timeout
    PauseJob( job, k_EJobPauseReasonWorkItem );

    // Success means the wait neither timed out nor had its work item canceled.
    if ( m_bJobTimedOut )
    {
        return false;
    }
    if ( job.m_bWorkItemCanceled )
    {
        return false;
    }
    return true;
}
//-----------------------------------------------------------------------------
// Purpose: adds a job work item to the thread pool
//-----------------------------------------------------------------------------
void CJobMgr::AddThreadedJobWorkItem( CWorkItem *pWorkItem )
{
    // Hand the work item straight to the work thread pool.
    m_WorkThreadPool.AddWorkItem( pWorkItem );
}
//-----------------------------------------------------------------------------
// Purpose: returns true if we're still working
//-----------------------------------------------------------------------------
bool CJobMgr::HasOutstandingThreadPoolWorkItems()
{
    // The thread pool is the sole authority on whether work items remain.
    const bool bPoolHasWork = m_WorkThreadPool.HasWorkItemsToProcess();
    return bPoolHasWork;
}
//-----------------------------------------------------------------------------
// Purpose: Mark that we're shutting down
//-----------------------------------------------------------------------------
void CJobMgr::SetIsShuttingDown()
{
    // during shutdown, we might abort jobs before waiting for the work item to complete
    m_WorkThreadPool.AllowTimeouts( true );

    // From here on CheckForJobTimeouts() treats the manager as shutting down.
    m_bIsShuttingDown = true;
}
//-----------------------------------------------------------------------------
// Purpose: Wakes up the specified waiting job.
// Input: jobID - The job that owns this work item
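//			bWorkItemCanceled - true if the job's work item was canceled
//			bShouldExist - Do we assert if the job doesn't exist?
//			bResumeImmediately - true to continue the job right away, false to queue it on the yield list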
// Output: true if the message was routed to a job
//-----------------------------------------------------------------------------
bool CJobMgr::BRouteWorkItemCompletedInternal( JobID_t jobID, bool bWorkItemCanceled, bool bShouldExist, bool bResumeImmediately )
{
    // this can resume jobs, make sure we didn't switch threads
    CheckThreadID();

    // The job must exist and be paused waiting on a work item.
    int iJob;
    if ( !BGetIJob( jobID, k_EJobPauseReasonWorkItem, bShouldExist, &iJob ) )
    {
        EG_MSG( SPEW_JOB, "BRouteWorkItemCompleted called for a job that could not be found!\n" );
        return false;
    }

    // Tell the job how its work item ended before it runs again.
    CJob *pJob = m_MapJob[iJob];
    pJob->m_bWorkItemCanceled = bWorkItemCanceled;

    if ( !bResumeImmediately )
    {
        // Deferred resume: queue on the yield list, then reset the sleep
        // reason to "yield".
        AddToYieldList( *pJob );
        pJob->m_ePauseReason = k_EJobPauseReasonYield;
    }
    else
    {
        // continue the job
        pJob->Continue();
    }

    return true;
}
//-----------------------------------------------------------------------------
// Purpose: Adds job to yield list (without actually pausing it) - internal
// Input : &job - job that is yielding
// Output : none
//-----------------------------------------------------------------------------
void CJobMgr::AddToYieldList( CJob &job )
{
#ifdef _DEBUG
    // Debug builds verify the job is not already on the yield list.
    FOR_EACH_LL( m_ListJobsYieldingRegPri, iYield )
    {
        Assert( m_ListJobsYieldingRegPri[iYield].m_JobID != job.GetJobID() );
    }
#endif

    // Append an entry stamped with the current yield iteration.
    JobYielding_t yieldEntry;
    yieldEntry.m_nIteration = m_nCurrentYieldIterationRegPri;
    yieldEntry.m_JobID = job.GetJobID();
    m_ListJobsYieldingRegPri.AddToTail( yieldEntry );
}
//-----------------------------------------------------------------------------
// called by a job that has just been started to place itself on the yield queue instead of running
//-----------------------------------------------------------------------------
void CJobMgr::AddDelayedJobToYieldList( CJob &job )
{
    //make sure that this job is setup to be yielded at this point, otherwise it will not resume properly
    const bool bInYieldState = ( k_EJobPauseReasonYield == job.GetPauseReason() );
    AssertMsg1( bInYieldState, "Delayed job %s was added to yield list but was not in expected yield state\n", job.GetName() );

    // The job is queued whether or not the assert fired.
    AddToYieldList( job );
}
//-----------------------------------------------------------------------------
// Purpose: yields until the next Run()
// Input : &job - job that is yielding
// Output : Returns true on success, false on failure.
//-----------------------------------------------------------------------------
bool CJobMgr::BYield( CJob &job )
{
    // Queue first so the job can be picked up again, then give up control.
    AddToYieldList( job );
    PauseJob( job, k_EJobPauseReasonYield );

    // Back from the pause: m_bJobTimedOut decides the result.
    return m_bJobTimedOut ? false : true;
}
//-----------------------------------------------------------------------------
// Purpose: yields IF NEEDED until the next Run()
// Input : &job - job that is possibly yielding
// pbYielded - optional, set to true if we did yield
// Output : Returns true on success, false on failure.
//-----------------------------------------------------------------------------
bool CJobMgr::BYieldIfNeeded( CJob &job, bool *pbYielded )
{
    // Assume no yield until one actually happens.
    if ( pbYielded )
    {
        *pbYielded = false;
    }

    // Only yield once the job has run for more than half the task granularity.
    const bool bOverBudget = job.GetMicrosecondsRun() > ( k_cMicroSecTaskGranularity / 2 );
    if ( !bOverBudget )
    {
        return true;
    }

    // *pbYielded receives BYield()'s result, so it stays false when the yield failed.
    const bool bYieldResult = BYield( job );
    if ( pbYielded )
    {
        *pbYielded = bYieldResult;
    }
    return bYieldResult;
}
//-----------------------------------------------------------------------------
// Purpose: Resumes jobs in list passed in that are ready to be awakened
//-----------------------------------------------------------------------------
bool CJobMgr::BResumeYieldingJobsFromList( CUtlLinkedList<JobYielding_t, int> &listJobsYielding, uint nCurrentIteration, CLimitTimer &limitTimer )
{
    while ( listJobsYielding.Count() != 0 )
    {
        const int iHead = listJobsYielding.Head();
        const JobYielding_t &yieldHead = listJobsYielding[ iHead ];

        // Entries stamped with a later iteration are left for a later pass.
        if ( yieldHead.m_nIteration > nCurrentIteration )
        {
            break;
        }

        // Look the job up before unlinking the entry, since the reference
        // above points into the list node.
        const int iJob = m_MapJob.Find( yieldHead.m_JobID );
        listJobsYielding.Remove( iHead );

        // The job is no longer registered; nothing to resume.
        if ( iJob == m_MapJob.InvalidIndex() )
        {
            continue;
        }

        CJob *pJob = m_MapJob[iJob];
        Assert( pJob->GetPauseReason() == k_EJobPauseReasonYield );

        // Should never be false, but if it is we
        // don't want to do anything to this job
        if ( k_EJobPauseReasonYield == pJob->GetPauseReason() )
        {
            // resume the job
            pJob->Continue();
        }

        // Out of time for this frame.
        if ( limitTimer.BLimitReached() )
        {
            break;
        }
    }

    // Anything still listed counts as remaining work.
    return ( listJobsYielding.Count() > 0 );
}
//-----------------------------------------------------------------------------
// Purpose: Resumes any yielding jobs that are ready to be awakened
// Input: limitTimer - limit timer not to exceed
// Output: true if there is still work remaining to do, false otherwise
//-----------------------------------------------------------------------------
bool CJobMgr::BResumeYieldingJobs( CLimitTimer &limitTimer )
{
    // Take the current iteration and bump the counter before resuming anything,
    // so a job that yields again during this pass is stamped with the next
    // iteration and is not picked up again in the same pass.
    const uint nIterationToRun = m_nCurrentYieldIterationRegPri++;

    return BResumeYieldingJobsFromList( m_ListJobsYieldingRegPri, nIterationToRun, limitTimer );
}
//-----------------------------------------------------------------------------
// Purpose: Resumes any sleeping jobs that are ready to be awakened
// Input: limitTimer - limit timer not to exceed
// Output: true if there is still work remaining to do, false otherwise
//-----------------------------------------------------------------------------
bool CJobMgr::BResumeSleepingJobs( CLimitTimer &limitTimer )
{
    while ( m_QueueJobSleeping.Count() != 0 )
    {
        const JobSleeping_t &sleeperHead = m_QueueJobSleeping.ElementAtHead();

        const bool bNotDueYet = sleeperHead.m_SWakeupTime.LTime() > CJobTime::LJobTimeCur();
        if ( bNotDueYet )
        {
            // The head of the queue is not ready to wake.
            // Check if we need to heartbeat
            if ( sleeperHead.m_STimeTouched.CServerMicroSecsPassed() >= k_cMicroSecJobHeartbeat )
            {
                const int iSleepingJob = m_MapJob.Find( sleeperHead.m_JobID );
                if ( iSleepingJob != m_MapJob.InvalidIndex() )
                {
                    m_MapJob[iSleepingJob]->Heartbeat();
                }
            }

            // Nothing more can be resumed right now, so report no remaining
            // work even though the queue is not empty.
            return false;
        }

        // pop the sleep off the top of the queue (look the job up first, since
        // the reference above points into the queue)
        const int iJob = m_MapJob.Find( sleeperHead.m_JobID );
        m_QueueJobSleeping.RemoveAtHead();

        // The job is no longer registered; nothing to resume.
        if ( iJob == m_MapJob.InvalidIndex() )
        {
            continue;
        }

        CJob *pJob = m_MapJob[iJob];
        Assert( pJob->GetPauseReason() == k_EJobPauseReasonSleepForTime );

        // should never be false, but if it is we don't want to do anything to this job
        if ( k_EJobPauseReasonSleepForTime == pJob->GetPauseReason() )
        {
            // resume the job
            pJob->Continue();
        }

        // Out of time for this frame.
        if ( limitTimer.BLimitReached() )
        {
            break;
        }
    }

    return ( m_QueueJobSleeping.Count() > 0 );
}
//-----------------------------------------------------------------------------
// Purpose: comparison function for sorting sleeping jobs list by time
// Output : Returns true if lhs has a later wakeup time than rhs
//-----------------------------------------------------------------------------
bool CJobMgr::JobSleepingLessFunc( JobSleeping_t const &lhs, JobSleeping_t const &rhs )
{
    // a lower time is a higher priority, so lhs orders "less" than rhs
    // exactly when rhs wakes up sooner
    const bool bRhsWakesFirst = rhs.m_SWakeupTime.LTime() < lhs.m_SWakeupTime.LTime();
    return bRhsWakesFirst;
}
// Debugging aid: CheckForJobTimeouts() emits "Heartbeat!" to the console when
// it heartbeats the job whose ID equals this value. Defaults to k_GIDNil.
JobID_t g_DebugJob = k_GIDNil;
//-----------------------------------------------------------------------------
// Purpose: quickly iterates the list of paused jobs to make sure none have been
//			paused for too long. Entries are taken from the head of
//			m_ListJobTimeouts; each one is either dropped, heartbeated and
//			re-queued at the tail, or heartbeated and timed out.
// Input  : limitTimer - once at least one entry has been examined, the scan
//			stops as soon as limitTimer.BLimitReached() returns true
//-----------------------------------------------------------------------------
void CJobMgr::CheckForJobTimeouts( CLimitTimer &limitTimer ) { // look through each active job
// remove from the list any job that has successfully received its I/O
// send a failure msg to any job that has timed out
// since the timeout time is constant, we only have to check until we find a job
// that has not yet been waiting for a full heartbeat interval
int cIter = 0; while ( m_ListJobTimeouts.Head() != m_ListJobTimeouts.InvalidIndex() ) { cIter ++;
// Break if limit timer is reached and we've already processed at least one item.
if ( cIter > 1 && limitTimer.BLimitReached() ) break;
JobTimeout_t &jobtimeout = m_ListJobTimeouts[ m_ListJobTimeouts.Head() ]; // see if it's timed out
// When shutting down the heartbeat-interval check is skipped, so every entry is processed
if ( !m_bIsShuttingDown && jobtimeout.m_STimeTouched.CServerMicroSecsPassed() < k_cMicroSecJobHeartbeat ) { // we haven't reached our recycle or timeout limit, which means none of the jobs passed us in the queue would have either
break; }
// get the first job in the list, which is the most likely to have timed out
// If the job is no longer in m_MapJob, just discard its timeout entry (from both the index map and the list)
int iJob = m_MapJob.Find( jobtimeout.m_JobID ); if ( m_MapJob.InvalidIndex() == iJob ) { m_MapJobTimeoutsIndexByJobID.Remove( jobtimeout.m_JobID ); m_ListJobTimeouts.Remove( m_ListJobTimeouts.Head() ); continue; }
// job still exists, make sure it is still paused at the same point
CJob *pJob = m_MapJob[iJob];
// Matching switch/pause times mean the job has not run since this entry was recorded, so spend one of its heartbeats
if ( pJob->GetTimeSwitched().LTime() == jobtimeout.m_STimePaused.LTime() ) { jobtimeout.m_cHeartbeatsBeforeTimeout--;
// Extra console spew for the job selected via g_DebugJob
if ( pJob->GetJobID() == g_DebugJob ) { EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "Heartbeat!\n" ); }
// Always heartbeat so anyone waiting on the job (say on another server) will know it is still alive
// Note that we even do this right before we timeout, since the job will actually be continued and may just loop itself right back into this waiting state
// Note also that we do NOT check pJob->GetNextHeartbeatTime() since we've already been watching our own timer
pJob->Heartbeat();
if ( m_bIsShuttingDown || jobtimeout.m_cHeartbeatsBeforeTimeout <= 0 ) { // Job finished all its available heartbeats before its timeout limit, timeout if appropriate and remove from the list
// The entry is removed here; jobtimeout is not read again on this path (only pJob is used below)
m_MapJobTimeoutsIndexByJobID.Remove( jobtimeout.m_JobID ); m_ListJobTimeouts.Remove( m_ListJobTimeouts.Head() );
// Lock waits, yields and SQL waits are never timed out; timed sleeps are only timed out during shutdown; every other pause reason is timed out
bool bShouldTimeout = true; switch ( pJob->m_ePauseReason ) { case k_EJobPauseReasonWaitingForLock: case k_EJobPauseReasonYield: case k_EJobPauseReasonSQL: bShouldTimeout = false; break; case k_EJobPauseReasonSleepForTime: bShouldTimeout = m_bIsShuttingDown; break; } // switch
// If the job WAS waiting on IO but now is waiting on a Lock, Sleeping,
// or Yielding, don't time it out.
// BUGBUG taylor we should fix things so that we can timeout Jobs waiting on
// Locks and have them properly unlink themselves from the Lock chain
if ( bShouldTimeout ) { TimeoutJob( *( pJob ) ); } } else { // Job has not yet used up all its available heartbeats before its timeout limit
// We've already decremented its m_cHeartbeatsBeforeTimeout, now Reset its touched time too
jobtimeout.m_STimeTouched.SetToJobTime(); // Move it back to the end of the queue so it can come back up to the top for either another heartbeat or a timeout
// After relinking, the job-ID -> list-index map is refreshed with the new tail index
m_ListJobTimeouts.LinkToTail( m_ListJobTimeouts.Head() ); int iIndexMap = m_MapJobTimeoutsIndexByJobID.Find( jobtimeout.m_JobID ); if ( iIndexMap != m_MapJobTimeoutsIndexByJobID.InvalidIndex() ) { int &iListIndex = m_MapJobTimeoutsIndexByJobID.Element( iIndexMap ); iListIndex = m_ListJobTimeouts.Tail(); } else { AssertMsg( false, "Map of jobs to timeout is corrupted" ); } }
continue; } else { // This is really the common heartbeating case, where the job waited a short while without ever reaching the k_cMicroSecJobHeartbeat limit
// Thus, we need to heartbeat before removing it from the list IF the job has gone too long without heartbeating
if ( pJob->BJobNeedsToHeartbeat() ) { pJob->Heartbeat(); }
// Since the job didn't actually time out, clear this timeout event
m_MapJobTimeoutsIndexByJobID.Remove( jobtimeout.m_JobID ); m_ListJobTimeouts.Remove( m_ListJobTimeouts.Head() ); } } }
//-----------------------------------------------------------------------------
// Purpose: Continues a job in a timed out state
// Input  : job - the paused job to resume. It is flagged with the kind of
//			timeout (network msg vs. anything else) before being continued.
//-----------------------------------------------------------------------------
void CJobMgr::TimeoutJob( CJob &job )
{
	if ( job.GetPauseReason() == k_EJobPauseReasonNetworkMsg )
	{
		job.m_flags.m_bits.m_bTimeoutNetMsg = true;
	}
	else
	{
		// these are so rare I dont want to add a column for them in the rollup
		// The job ID is printed with %llu, the same conversion DumpJob() uses
		// for job IDs, so large IDs are not shown as negative numbers.
		EG_WARNING( SPEW_JOB, "Resuming job '%s (id: %llu)' due to timeout while paused for %s\n", job.GetName(), job.GetJobID(), job.GetPauseReasonDescription() );
		job.m_flags.m_bits.m_bTimeoutOther = true;
	}

	m_JobStats.m_cJobsTimedOut++;

	// m_bJobTimedOut is raised only for the duration of the Continue() call
	m_bJobTimedOut = true;
	job.Continue();
	m_bJobTimedOut = false;
}
//-----------------------------------------------------------------------------
// Purpose: wakes up a job that was waiting on a lock
// Input  : job - job expected to be paused with
//			k_EJobPauseReasonWaitingForLock; any other pause reason asserts
//			and leaves the job untouched
//-----------------------------------------------------------------------------
void CJobMgr::WakeupLockedJob( CJob &job )
{
	Assert( job.m_ePauseReason == k_EJobPauseReasonWaitingForLock );

	// in case of error, do nothing at all so as not to cause more trouble
	if ( job.m_ePauseReason == k_EJobPauseReasonWaitingForLock )
	{
		// insert the job into the yielding list so it will wakeup next Run
		AddToYieldList( job );

		// reset the sleep reason
		job.m_ePauseReason = k_EJobPauseReasonYield;
	}
}
//-----------------------------------------------------------------------------
// Purpose: Pauses a job, and puts it in a list to check for timeouts
// Input  : job - the job to pause
//			eJobPauseReason - why the job is pausing; passed on to
//			job.Pause(). k_EJobPauseReasonWorkItem gets a 6 hour timeout
//			budget instead of the job's own heartbeat count.
//-----------------------------------------------------------------------------
void CJobMgr::PauseJob( CJob &job, EJobPauseReason eJobPauseReason )
{
	// Pausing while pauses are disallowed is reported, but the pause still proceeds
	Assert( !m_bDebugDisallowPause );
	if ( m_bDebugDisallowPause )
	{
		EmitError( SPEW_GC, "Job %s attempted to pause even though pauses were disabled\n", job.GetName() );
	}

	// add to list to check for timeouts later (or update the existing entry if it is already there)
	JobTimeout_t *pJobTimeout;
	int iMapIndex = m_MapJobTimeoutsIndexByJobID.Find( job.GetJobID() );
	if ( iMapIndex == m_MapJobTimeoutsIndexByJobID.InvalidIndex() )
	{
		pJobTimeout = &m_ListJobTimeouts[ m_ListJobTimeouts.AddToTail() ];
		m_MapJobTimeoutsIndexByJobID.Insert( job.GetJobID(), m_ListJobTimeouts.Tail() );
	}
	else
	{
		// There was an existing entry, in addition to updating it, move it to the tail
		int &iListIndex = m_MapJobTimeoutsIndexByJobID.Element( iMapIndex );
		m_ListJobTimeouts.LinkToTail( iListIndex );
		iListIndex = m_ListJobTimeouts.Tail();

		pJobTimeout = &m_ListJobTimeouts.Element( iListIndex );
	}

	pJobTimeout->m_JobID = job.GetJobID();
	pJobTimeout->m_STimePaused.SetToJobTime();
	pJobTimeout->m_STimeTouched.SetToJobTime();
	pJobTimeout->m_cHeartbeatsBeforeTimeout = job.CHeartbeatsBeforeTimeout();
	if ( eJobPauseReason == k_EJobPauseReasonWorkItem )
	{
		// work items control their own schedule - wait up to 6 hours.
		// Six hours is 21.6 billion microseconds, which does not fit in a
		// 32-bit integer, so the product is computed in 64 bits before being
		// divided down to a heartbeat count.
		const int64 cMicroSecWorkItemWait = (int64)6 * 60 * 60 * k_nMillion;
		pJobTimeout->m_cHeartbeatsBeforeTimeout = (int)( cMicroSecWorkItemWait / k_cMicroSecJobHeartbeat );
	}

	// never leave an entry without at least the default number of heartbeats
	if ( pJobTimeout->m_cHeartbeatsBeforeTimeout <= 0 )
	{
		pJobTimeout->m_cHeartbeatsBeforeTimeout = k_cJobHeartbeatsBeforeTimeoutDefault;
	}

	// tell the job to pause
	job.Pause( eJobPauseReason );
}
//-----------------------------------------------------------------------------
// Purpose: dumps a list of currently active jobs to the console
// Output : int - number of jobs listed
//-----------------------------------------------------------------------------
int CJobMgr::DumpJobSummary() { CUtlMap< uint32, JobStatsBucket_t, int > mapStatsBucket( 0, 0, DefLessFunc( uint32 ) );
FOR_EACH_MAP_FAST( m_MapJob, i ) { CJob &job = *m_MapJob[i];
// the pointer to the name is a pointer to a constant string
// so use this dirty trick to make lookups fast
uint32 eBucket = (uint32)job.GetName(); int iBucket = mapStatsBucket.Find( eBucket ); if ( iBucket == mapStatsBucket.InvalidIndex() ) { iBucket = mapStatsBucket.Insert( eBucket ); V_strcpy_safe( mapStatsBucket[iBucket].m_rgchName, job.GetName() ); }
JobStatsBucket_t *pJobStatsBucket = &mapStatsBucket[iBucket]; pJobStatsBucket->m_cCompletes++; // overloading this to really mean "jobs running" for this spew
pJobStatsBucket->m_cLocksAttempted += job.m_vecLocks.Count(); // overloading this to really be used for "locks held" for this spew
pJobStatsBucket->m_u64JobDuration += job.m_STimeStarted.CServerMicroSecsPassed();
switch ( job.m_ePauseReason ) { case k_EJobPauseReasonNetworkMsg: pJobStatsBucket->m_cPauseReasonNetworkMsg++; break; case k_EJobPauseReasonSleepForTime: pJobStatsBucket->m_cPauseReasonSleepForTime++; break; case k_EJobPauseReasonWaitingForLock: pJobStatsBucket->m_cPauseReasonWaitingForLock++; break; case k_EJobPauseReasonYield: pJobStatsBucket->m_cPauseReasonYield++; break; case k_EJobPauseReasonSQL: pJobStatsBucket->m_cPauseReasonSQL++; break; case k_EJobPauseReasonWorkItem: pJobStatsBucket->m_cPauseReasonWorkItem++; break; default: break; } }
EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%50s --- running jobs (usec)-- -- locks held -- ----- pause reasons ---------------------------------\n", " " ); EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%50s count aveduration netmsg sql sleep waitlock yield workitem\n", "name" );
JobProfileStats_t jobprofilestats; jobprofilestats.m_iJobProfileSort = k_EJobProfileSortOrder_Count; jobprofilestats.pmapStatsBucket = &mapStatsBucket;
CUtlVector<int> vecSort( 0, mapStatsBucket.Count() ); FOR_EACH_MAP_FAST( mapStatsBucket, iBucket ) { vecSort.AddToTail( iBucket ); } V_qsort_s( vecSort.Base(), vecSort.Count(), sizeof(int), (QSortCompareFuncCtx_t)ProfileSortFunc, &jobprofilestats );
FOR_EACH_VEC( vecSort, iVec ) { JobStatsBucket_t &bucket = mapStatsBucket[ vecSort[iVec] ];
int64 msecDurationAve = bucket.m_u64JobDuration / bucket.m_cCompletes;
EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%50s %8lld %16lld %13lld %11lld %8lld %8lld %8lld %8lld %8lld \n", bucket.m_rgchName, bucket.m_cCompletes, msecDurationAve, bucket.m_cLocksAttempted,
bucket.m_cPauseReasonNetworkMsg, bucket.m_cPauseReasonSQL, bucket.m_cPauseReasonSleepForTime, bucket.m_cPauseReasonWaitingForLock, bucket.m_cPauseReasonYield, bucket.m_cPauseReasonWorkItem ); }
return m_MapJob.Count(); }
//-----------------------------------------------------------------------------
// Purpose: spews details about a job by ID: its name and pause reason, the
//			lock it is waiting on (if any) and every lock it holds
// Input  : jobID - ID of the job to look up via GetPJob()
//			nPrintLocksMax - forwarded to CLock::Dump() for each lock printed
//-----------------------------------------------------------------------------
void CJobMgr::DumpJob( JobID_t jobID, int nPrintLocksMax ) const
{
	const CJob *pJob = GetPJob( jobID );
	if ( !pJob )
	{
		EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "Invalid job ID %llu\n", jobID );
		return;
	}

	// one-line header for the job
	EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%llu\t%12s %12s\n", pJob->GetJobID(), pJob->GetName(), pJob->GetPauseReasonDescription() );

	// the lock this job is blocked on, and where it asked for it
	const bool bBlockedOnLock = ( pJob->GetPauseReason() == k_EJobPauseReasonWaitingForLock ) && ( pJob->m_pWaitingOnLock != NULL );
	if ( bBlockedOnLock )
	{
		EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "\tWaiting for lock %s from: %s line %d\n", pJob->m_pWaitingOnLock->GetName(), pJob->m_pWaitingOnLockFilename, pJob->m_waitingOnLockLine );
		pJob->m_pWaitingOnLock->Dump( "\t ", nPrintLocksMax, true );
	}

	// every lock the job currently holds
	FOR_EACH_VEC( pJob->m_vecLocks, nLock )
	{
		CLock *pLock = pJob->m_vecLocks[nLock];
		EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "\tHolding lock %s:\n", pLock->GetName() );
		pLock->Dump( "\t ", nPrintLocksMax, true );
	}
}
//-----------------------------------------------------------------------------
// Purpose: count the number of active jobs
// Output : int - number of entries currently in m_MapJob
//-----------------------------------------------------------------------------
int CJobMgr::CountJobs() const { return m_MapJob.Count(); }
//-----------------------------------------------------------------------------
// Purpose: verify that current thread is correct. The first call records the
//			calling thread as the frame function thread; every later call
//			asserts that it is running on that same thread.
//-----------------------------------------------------------------------------
void CJobMgr::CheckThreadID()
{
	uint unCurrentThread = ThreadGetCurrentId();

	// nothing recorded yet: adopt the caller's thread and we're done
	if ( m_unFrameFuncThreadID == 0 )
	{
		m_unFrameFuncThreadID = unCurrentThread;
		return;
	}

	// if this Assert goes off, you most likely tried to start
	// a job from a different thread than the frame function thread
	Assert( m_unFrameFuncThreadID == unCurrentThread );
}
//-----------------------------------------------------------------------------
// Purpose: JobType_t comparer, used to sort the list of registered
//			jobs into a tree by msg that creates them
// Output : true if lhs orders before rhs: creation msg first, then server
//			type when the creation msgs are equal
//-----------------------------------------------------------------------------
bool JobTypeSortFuncByMsg( JobType_t const * const &lhs, JobType_t const * const &rhs )
{
	// primary key: the creation msg
	if ( lhs->m_eCreationMsg != rhs->m_eCreationMsg )
	{
		return ( lhs->m_eCreationMsg < rhs->m_eCreationMsg );
	}

	// same creation msg: fall back to the server type
	return ( lhs->m_eServerType < rhs->m_eServerType );
}
//-----------------------------------------------------------------------------
// Purpose: JobType_t comparer, used to sort the list of registered
//			jobs into a tree by job name
// Output : true if lhs orders before rhs: Q_strcmp on the name first, then
//			server type when the names compare equal
//-----------------------------------------------------------------------------
bool JobTypeSortFuncByName( JobType_t const * const &lhs, JobType_t const * const &rhs )
{
	const int nNameOrder = Q_strcmp( lhs->m_pchName, rhs->m_pchName );

	// different names decide the ordering on their own
	if ( nNameOrder != 0 )
	{
		return ( nNameOrder < 0 );
	}

	// identical names: fall back to the server type
	return ( lhs->m_eServerType < rhs->m_eServerType );
}
// singleton accessor to the tree of registered job types ordered by
// JobTypeSortFuncByMsg; the tree is a function-local static
CUtlRBTree<const JobType_t *> &GMapJobTypesByMsg() { static CUtlRBTree<const JobType_t *> s_MapJobTypes( 0, 0, JobTypeSortFuncByMsg ); return s_MapJobTypes; }
// singleton accessor to the tree of registered job types ordered by
// JobTypeSortFuncByName; the tree is a function-local static
CUtlRBTree<const JobType_t *> &GMapJobTypesByName() { static CUtlRBTree<const JobType_t *> s_MapJobTypes( 0, 0, JobTypeSortFuncByName ); return s_MapJobTypes; }
//-----------------------------------------------------------------------------
// Purpose: adds a new type of job into the global list
//-----------------------------------------------------------------------------
void CJobMgr::RegisterJobType( const JobType_t *pJobType ) { Assert( pJobType->m_pchName != NULL ); Assert( pJobType->m_pJobFactory != NULL ); GMapJobTypesByMsg().Insert( pJobType ); GMapJobTypesByName().Insert( pJobType ); }
//-----------------------------------------------------------------------------
// Purpose: Creates a new job from the network msg
// Input : *pServerParent - server to attach job to
// msg - network msg
// Output : true if a job was created
//-----------------------------------------------------------------------------
bool CJobMgr::BLaunchJobFromNetworkMsg( void *pParent, const JobMsgInfo_t &jobMsgInfo, IMsgNetPacket *pNetPacket ) { if ( pNetPacket == NULL ) { AssertMsg(pNetPacket, "CJobMgr::BLaunchJobFromNetworkMsg received NULL packet."); return false; }
if ( pNetPacket->BHasTargetJobName() && BIsValidSystemMsg( pNetPacket->GetEMsg(), NULL ) ) { JobType_t jobSearch = { pNetPacket->GetTargetJobName(), k_EGCMsgInvalid, jobMsgInfo.m_eServerType }; int iJobType = GMapJobTypesByName().Find( &jobSearch );
if ( GMapJobTypesByName().IsValidIndex( iJobType ) ) {
// Get shortcut to job info
const JobType_t *pJobType = (GMapJobTypesByName())[iJobType]; Assert( pJobType ); Assert( pJobType->m_pchName );
// Create the job
CJob *job = pJobType->m_pJobFactory( pParent, NULL );
// Safety check
if ( job == NULL ) { AssertMsg1( job, "Job factory returned NULL for job named '%s'!\n", pJobType->m_pchName ); return false; }
// Start the job
job->StartJobFromNetworkMsg( pNetPacket, jobMsgInfo.m_JobIDSource ); return true; } } else { JobType_t jobSearch = { 0, jobMsgInfo.m_eMsg, jobMsgInfo.m_eServerType }; int iJobType = GMapJobTypesByMsg().Find( &jobSearch );
if ( GMapJobTypesByMsg().IsValidIndex( iJobType ) ) {
// Get shortcut to job info
const JobType_t *pJobType = (GMapJobTypesByMsg())[iJobType]; Assert( pJobType ); Assert( pJobType->m_pchName );
// Create the job
CJob *job = pJobType->m_pJobFactory( pParent, NULL );
// Safety check
if ( job == NULL ) { AssertMsg3( job, "Job factory returned NULL for job msg %d, server type %d (named '%s')!\n", (int)jobMsgInfo.m_eMsg, (int)jobMsgInfo.m_eServerType, pJobType->m_pchName ); return false; }
// Start the job
job->StartJobFromNetworkMsg( pNetPacket, jobMsgInfo.m_JobIDSource ); return true; } }
return false; }
//-----------------------------------------------------------------------------
// Purpose: profile sort func
//-----------------------------------------------------------------------------
int CJobMgr::ProfileSortFunc( void *pCtx, const int *lhs, const int *rhs ) { JobProfileStats_t *pJobprofilestats = (JobProfileStats_t *)pCtx; int64 d = 0; switch ( pJobprofilestats->m_iJobProfileSort ) { default: case k_EJobProfileSortOrder_Alpha: return Q_stricmp( pJobprofilestats->pmapStatsBucket->Element(*lhs).m_rgchName, pJobprofilestats->pmapStatsBucket->Element(*rhs).m_rgchName ); case k_EJobProfileSortOrder_Count: d = ((int64)pJobprofilestats->pmapStatsBucket->Element(*rhs).m_cCompletes - (int64)pJobprofilestats->pmapStatsBucket->Element(*lhs).m_cCompletes); break; case k_EJobProfileSortOrder_TotalRuntime: d = ((int64)pJobprofilestats->pmapStatsBucket->Element(*rhs).m_u64RunTime - (int64)pJobprofilestats->pmapStatsBucket->Element(*lhs).m_u64RunTime); break; } if ( d < 0 ) return -1; if ( d > 0 ) return 1; return 0; }
//-----------------------------------------------------------------------------
// Purpose: controls job profiling and dumps out accumulated job profile data
// Input  : ejobProfileAction - Start (clears the buckets if profiling was
//			off), Stop, Clear, or Dump. Only Dump prints anything.
//			iSortOrder - ordering of the dumped rows, see ProfileSortFunc
//-----------------------------------------------------------------------------
void CJobMgr::ProfileJobs( EJobProfileAction ejobProfileAction, EJobProfileSortOrder iSortOrder )
{
	// Apply the state change, if any, that the action asks for
	bool bResetBuckets = false;
	switch ( ejobProfileAction )
	{
	case k_EJobProfileAction_Start:
		// a fresh start (not a repeated Start) begins from empty buckets
		bResetBuckets = !m_bProfiling;
		m_bProfiling = true;
		break;

	case k_EJobProfileAction_Stop:
		m_bProfiling = false;
		break;

	case k_EJobProfileAction_Clear:
		bResetBuckets = true;
		break;

	default:
		break;
	}

	if ( bResetBuckets )
	{
		m_mapStatsBucket.RemoveAll();
	}

	// everything below is the Dump action
	if ( ejobProfileAction != k_EJobProfileAction_Dump )
	{
		return;
	}

	EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%44s --- completed jobs (usec)---------------------------------- ------ lock counts---------------------------------- ------ failures -----------\n", " " );
	EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%44s count averuntime maxruntime aveduration #yielded attempted waited failed longheld longwait wait-t/o t/o-msg jobfailed longslice\n", "name" );

	// sort the bucket indices in the requested order
	JobProfileStats_t sortCtx;
	sortCtx.m_iJobProfileSort = iSortOrder;
	sortCtx.pmapStatsBucket = &m_mapStatsBucket;

	CUtlVector<int> vecOrder( 0, m_mapStatsBucket.Count() );
	FOR_EACH_MAP_FAST( m_mapStatsBucket, iBucket )
	{
		vecOrder.AddToTail( iBucket );
	}
	V_qsort_s( vecOrder.Base(), vecOrder.Count(), sizeof(int), (QSortCompareFuncCtx_t)ProfileSortFunc, &sortCtx );

	// one row per bucket that has at least one completed job
	FOR_EACH_VEC( vecOrder, iRow )
	{
		JobStatsBucket_t &row = m_mapStatsBucket[ vecOrder[iRow] ];
		if ( !row.m_cCompletes )
		{
			continue;
		}

		CCycleCount ccAveRunTime( row.m_u64RunTime / row.m_cCompletes );
		int64 usecRunAve = ccAveRunTime.GetMicroseconds();

		CCycleCount ccMaxRunTime( row.m_u64RunTimeMax );
		int64 usecRunMax = ccMaxRunTime.GetMicroseconds();

		int64 cDurationAve = row.m_u64JobDuration / row.m_cCompletes;

		EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%44s %12lld %12lld %12lld %12lld %8lld %8lld %8lld %8lld %8lld %8lld %8lld %8lld %8lld %8lld\n",
			row.m_rgchName,
			row.m_cCompletes,
			usecRunAve,
			usecRunMax,
			cDurationAve,
			row.m_cJobsPaused,
			row.m_cLocksAttempted,
			row.m_cLocksWaitedFor,
			row.m_cLocksFailed,
			row.m_cLocksLongHeld,
			row.m_cLocksLongWait,
			row.m_cWaitTimeout,
			row.m_cTimeoutNetMsg,
			row.m_cJobsFailed,
			row.m_cLongInterYieldTime );
	}

	// orphaned replies are reported once and then forgotten
	if ( m_mapOrphanMessages.Count() )
	{
		EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "Messages that arrived responding to jobs that no longer exists and were dropped\n" );
		FOR_EACH_MAP_FAST( m_mapOrphanMessages, iOrphan )
		{
			EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "%44s %12d\n", PchMsgNameFromEMsg( m_mapOrphanMessages.Key(iOrphan) ), m_mapOrphanMessages[iOrphan] );
		}
		m_mapOrphanMessages.RemoveAll();
	}
}
//-----------------------------------------------------------------------------
// Purpose: Dump a list of all jobs to the console, followed by the total
//			job count
// Input  : pszJobName - if non-NULL, only jobs whose name matches exactly
//			are dumped
//			nMax - maximum number of jobs to visit
//			nPrintLocksMax - forwarded to DumpJob()
//-----------------------------------------------------------------------------
void CJobMgr::DumpJobs( const char *pszJobName, int nMax, int nPrintLocksMax ) const
{
	FOR_EACH_MAP_FAST( m_MapJob, iJob )
	{
		// NOTE(review): the budget is spent on every job visited, including
		// ones the name filter then skips - confirm that is intended.
		if ( nMax <= 0 )
		{
			break;
		}
		--nMax;

		const bool bNameMatches = ( pszJobName == NULL ) || ( V_strcmp( pszJobName, m_MapJob[iJob]->GetName() ) == 0 );
		if ( !bNameMatches )
		{
			continue;
		}

		DumpJob( m_MapJob.Key(iJob), nPrintLocksMax );
	}

	EmitInfo( SPEW_CONSOLE, SPEW_ALWAYS, LOG_ALWAYS, "Total job count: %d\n", m_MapJob.Count() );
}
//-----------------------------------------------------------------------------
// Purpose: cause a debug break in the given job
// Input  : iJob - index into sm_listAllJobs. Only used when DEBUG_JOB_LIST is
//			defined; otherwise a "disabled" message is printed instead.
//-----------------------------------------------------------------------------
void CJobMgr::DebugJob( int iJob )
{
	// Each preprocessor directive sits on its own line; a directive that
	// follows other tokens on a line is not recognised by the preprocessor.
#ifdef DEBUG_JOB_LIST
	if ( sm_listAllJobs.IsValidIndex( iJob ) )
	{
		sm_listAllJobs[iJob]->Debug();
	}
	else
	{
		EmitInfo( SPEW_CONSOLE, 1, 1, "Job not found\n" );
	}
#else
	EmitInfo( SPEW_CONSOLE, 1, 1, "Job debugging disabled\n" );
#endif
}
#ifdef DBGFLAG_VALIDATE
//-----------------------------------------------------------------------------
// Purpose: Run a global validation pass on all of our data structures and memory
//			allocations.
// Input:	validator -		Our global validator object
//			pchName -		Our name (typically a member var in our container)
//-----------------------------------------------------------------------------
void CJobMgr::Validate( CValidator &validator, const char *pchName )
{
	VALIDATE_SCOPE();

	// the job map, plus every job it points at
	ValidateObj( m_MapJob );
	FOR_EACH_MAP_FAST( m_MapJob, iJob )
	{
		ValidatePtr( m_MapJob[iJob] );
	}

	// the profiling buckets, plus each bucket
	ValidateObj( m_mapStatsBucket );
	FOR_EACH_MAP_FAST( m_mapStatsBucket, iBucket )
	{
		ValidateObj( m_mapStatsBucket[iBucket] );
	}

	// scheduling containers and the worker thread pool
	ValidateObj( m_ListJobsYieldingRegPri );
	ValidateObj( m_ListJobTimeouts );
	ValidateObj( m_MapJobTimeoutsIndexByJobID );
	ValidateObj( m_QueueJobSleeping );
	ValidateObj( m_WorkThreadPool );
}

//-----------------------------------------------------------------------------
// Purpose: Run a global validation pass on all of our global data
// Input:	validator -		Our global validator object
//			pchName -		Our name
//-----------------------------------------------------------------------------
void CJobMgr::ValidateStatics( CValidator &validator, const char *pchName )
{
	VALIDATE_SCOPE_STATIC( "CJobMgr class statics" );

	ValidateObj( GMapJobTypesByMsg() );
	ValidateObj( GMapJobTypesByName() );

	// sm_listAllJobs only exists in DEBUG_JOB_LIST builds. The directives are
	// kept on their own lines so the preprocessor recognises them.
#ifdef DEBUG_JOB_LIST
	ValidateObj( sm_listAllJobs );
#endif
}
#endif // DBGFLAG_VALIDATE
} // namespace GCSDK
|