Go to the source code of this file.
Data Structures | |
struct | _GroupInfo |
class | ElementCheckpointer |
class | CkCheckpointMgr |
There is only one Checkpoint Manager in the whole system. More... | |
class | CkCheckpointInit |
Typedefs | |
typedef struct _GroupInfo | GroupInfo |
typedef void | GroupCreationFn (CkGroupID groupID, int constructorIdx, envelope *env) |
Functions | |
void | noopit (const char *,...) |
PUPbytes (GroupInfo) | |
void | _initDone () |
This function (not a handler) is called once and only once per processor. | |
static void | bdcastRO (void) |
static void | bdcastROGroupData (void) |
void | printIndex (const CkArrayIndex &idx, char *dest) |
static bool | checkpointOne (const char *dirname, CkCallback &cb, bool requestStatus) |
static void | addPartitionDirectory (ostringstream &path) |
static FILE * | openCheckpointFile (const char *dirname, const char *basename, const char *mode, int id=-1) |
void | CkPupROData (PUP::er &p) |
void | CkPupMainChareData (PUP::er &p, CkArgMsg *args) |
CkpvExtern (std::vector< void * >, chare_objs) | |
CkpvExtern (std::vector< int >, chare_types) | |
CkpvExtern (std::vector< VidBlock * >, vidblocks) | |
void | CkPupChareData (PUP::er &p) |
static void | CkPupPerPlaceData (PUP::er &p, GroupIDTable *idTable, GroupTable *objectTable, unsigned int &numObjects, int constructionMsgType, GroupCreationFn creationFn #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)) , bool create #endif ) |
void | CkPupGroupData (PUP::er &p #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)) , bool create #endif ) |
void | CkPupNodeGroupData (PUP::er &p #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)) , bool create #endif ) |
void | CkPupArrayElementsData (PUP::er &p, int notifyListeners) |
int | CkCountArrayElements () |
void | CkPupProcessorData (PUP::er &p) |
void | CkRemoveArrayElements () |
void | CkStartCheckpoint (const char *dirname, const CkCallback &cb, bool requestStatus) |
void | CkRestartMain (const char *dirname, CkArgMsg *args) |
void | CkResumeRestartMain (char *msg) |
Variables | |
CkGroupID | _sysChkptMgr |
CkCallback | cb |
Restart: No restart manager object is created, because a group cannot restore itself anyway. |
typedef struct _GroupInfo GroupInfo |
typedef void GroupCreationFn(CkGroupID groupID, int constructorIdx, envelope *env) |
Definition at line 444 of file ckcheckpoint.C.
void noopit | ( | const char * | , | |
... | ||||
) |
Definition at line 24 of file ckcheckpoint.C.
PUPbytes | ( | GroupInfo | ) |
Definition at line 41 of file ckcheckpoint.C.
static void bdcastRO | ( | void | ) | [static] |
Definition at line 94 of file ckcheckpoint.C.
References _allocEnv(), _numInitMsgs, _readonlyTable, _roRestartHandlerIdx, Converse::CkMyPe(), Converse::CmiSyncBroadcastAndFree(), EnvToUsr(), envelope::getTotalsize(), RODataMsg, envelope::setCount(), envelope::setSrcPe(), and PUP::sizer::size().
Referenced by CkPupMainChareData().
static void bdcastROGroupData | ( | void | ) | [static] |
Definition at line 116 of file ckcheckpoint.C.
References _ROGroupRestartHandlerIdx, CkPupGroupData(), CkPupROData(), CmiAlloc(), Converse::CmiSyncBroadcastAllAndFree(), int, msg, PUP::mem::size(), and PUP::sizer::size().
void printIndex | ( | const CkArrayIndex & | idx, | |
char * | dest | |||
) |
Definition at line 148 of file ckcheckpoint.C.
static bool checkpointOne | ( | const char * | dirname, | |
CkCallback & | cb, | |||
bool | requestStatus | |||
) | [static] |
Definition at line 651 of file ckcheckpoint.C.
References PUP::toDisk::checkError(), Converse::CkMyPe(), BGConverse::CkNumNodes(), Converse::CkNumPes(), CkPupMainChareData(), CkPupROData(), CmiFclose(), and openCheckpointFile().
Referenced by CkCheckpointMgr::Checkpoint().
static void addPartitionDirectory | ( | ostringstream & | path | ) | [static] |
Definition at line 158 of file ckcheckpoint.C.
Referenced by CkCheckpointMgr::Checkpoint(), and openCheckpointFile().
static FILE* openCheckpointFile | ( | const char * | dirname, | |
const char * | basename, | |||
const char * | mode, | |||
int | id = -1 | |||
) | [static] |
Definition at line 164 of file ckcheckpoint.C.
References addPartitionDirectory(), Converse::CkMyPe(), and CmiFopen().
Referenced by CkCheckpointMgr::Checkpoint(), checkpointOne(), CkRestartMain(), and CkResumeRestartMain().
void CkPupROData | ( | PUP::er & | p | ) |
Definition at line 307 of file ckcheckpoint.C.
References _readonlyMsgs, _readonlyTable, c, CkPupMessage(), PUP::er::isUnpacking(), and ReadonlyMsgInfo::pMsg.
Referenced by _handleProcData(), _recvCheckpointHandler(), _recvRestartCheckpointHandler(), _startCheckpointHandler(), bdcastROGroupData(), checkpointOne(), CkPupProcessorData(), CkRestartMain(), CkResumeRestartMain(), and startMlogCheckpoint().
void CkPupMainChareData | ( | PUP::er & | p, | |
CkArgMsg * | args | |||
) |
Definition at line 329 of file ckcheckpoint.C.
References _chareTable, _entryTable, _mainTable, bdcastRO(), Converse::CkMyPe(), ChareInfo::getMigCtor(), PUP::er::isUnpacking(), malloc(), ChareInfo::name, ChareInfo::size, size, PUP::er::typeString(), and Chare::virtual_pup().
Referenced by _handleProcData(), checkpointOne(), CkPupProcessorData(), and CkRestartMain().
CkpvExtern | ( | std::vector< void * > | , | |
chare_objs | ||||
) |
CkpvExtern | ( | std::vector< int > | , | |
chare_types | ||||
) |
CkpvExtern | ( | std::vector< VidBlock * > | , | |
vidblocks | ||||
) |
void CkPupChareData | ( | PUP::er & | p | ) |
Definition at line 371 of file ckcheckpoint.C.
References _chareTable, buf, CkAllocSysMsg(), CkCreateLocalChare(), CkFreeSysMsg(), PUP::er::isUnpacking(), PUP::m, n, name, VidBlock::pup(), UsrToEnv(), and Chare::virtual_pup().
Referenced by _handleProcData(), CkCheckpointMgr::Checkpoint(), CkPupProcessorData(), and CkRestartMain().
static void CkPupPerPlaceData | ( | PUP::er & | p, | |
GroupIDTable * | idTable, | |||
GroupTable * | objectTable, | |||
unsigned int & | numObjects, | |||
int | constructionMsgType, | |||
GroupCreationFn | creationFn #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)), | |||
bool | create #endif | |||
) | [static] |
Definition at line 446 of file ckcheckpoint.C.
References _chareTable, buf, CkAllocSysMsg(), CkCreateLocalGroup(), Converse::CkMyPe(), GroupIdxArray< dtype >::find(), TableEntry::getcIdx(), TableEntry::getObj(), PUP::er::isUnpacking(), PUP::m, Chare::mlogData, name, envelope::setMsgtype(), ChareMlogData::teamRecoveryFlag, PUP::er::typeString(), UsrToEnv(), and Chare::virtual_pup().
Referenced by CkPupGroupData(), and CkPupNodeGroupData().
void CkPupGroupData | ( | PUP::er & | p #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)), | |
bool | create #endif | |||
) |
Definition at line 524 of file ckcheckpoint.C.
References BocInitMsg, CkCreateLocalGroup(), and CkPupPerPlaceData().
Referenced by _handleProcData(), _recvCheckpointHandler(), _recvRestartCheckpointHandler(), _startCheckpointHandler(), bdcastROGroupData(), CkCheckpointMgr::Checkpoint(), CkPupProcessorData(), CkRestartMain(), CkResumeRestartMain(), and startMlogCheckpoint().
void CkPupNodeGroupData | ( | PUP::er & | p #if (defined(_FAULT_MLOG_) || defined(_FAULT_CAUSAL_)), | |
bool | create #endif | |||
) |
Definition at line 538 of file ckcheckpoint.C.
References CkCreateLocalNodeGroup(), CkPupPerPlaceData(), and NodeBocInitMsg.
Referenced by _handleProcData(), _recvCheckpointHandler(), _recvRestartCheckpointHandler(), _startCheckpointHandler(), CkCheckpointMgr::Checkpoint(), CkPupProcessorData(), CkRestartMain(), and startMlogCheckpoint().
void CkPupArrayElementsData | ( | PUP::er & | p, | |
int | notifyListeners | |||
) |
Definition at line 554 of file ckcheckpoint.C.
References IrrGroup::ckJustMigrated(), Converse::CkMyPe(), idx, PUP::er::isUnpacking(), CkLocMgr::restore(), CkLocMgr::resume(), and PUP::er::typeString().
Referenced by CkCheckpointMgr::Checkpoint(), CkPupProcessorData(), CkRestartMain(), and CkResumeRestartMain().
int CkCountArrayElements | ( | ) |
Definition at line 605 of file ckcheckpoint.C.
Referenced by CkMemCheckPT::pupAllElements(), and pupArrayElementsSkip().
void CkPupProcessorData | ( | PUP::er & | p | ) |
Definition at line 615 of file ckcheckpoint.C.
References Converse::CkMyPe(), BGConverse::CkMyRank(), CkPupArrayElementsData(), CkPupChareData(), CkPupGroupData(), CkPupMainChareData(), CkPupNodeGroupData(), and CkPupROData().
void CkRemoveArrayElements | ( | ) |
Definition at line 694 of file ckcheckpoint.C.
void CkStartCheckpoint | ( | const char * | dirname, | |
const CkCallback & | cb, | |||
bool | requestStatus | |||
) |
Definition at line 723 of file ckcheckpoint.C.
References Converse::CkMyPe(), CkCallback::containsPointer(), and CkCallback::isInvalid().
Referenced by PVT::beginCheckpoint(), CentralLB::CheckForRealloc(), ArmciVirtualProcessor::checkpoint(), and sim::SeqBeginCheckpoint().
void CkResumeRestartMain | ( | char * | msg | ) |
Definition at line 855 of file ckcheckpoint.C.
References _initDone(), _inrestart, _restarted, Converse::CkMyPe(), CkPupArrayElementsData(), CkPupGroupData(), CkPupROData(), CmiFclose(), CmiFree(), CmiNodeBarrier(), CmiPrintf(), CmiWallTimer(), CkMemCheckPT::inRestarting, openCheckpointFile(), p, and CkCallback::send().
Referenced by _ROGroupRestartHandler().
CkGroupID _sysChkptMgr
Definition at line 33 of file ckcheckpoint.C.
CkCallback cb
Restart: No restart manager object is created, because a group cannot restore itself anyway.
Instead, the restart mechanism exists as Converse code and gets invoked by a broadcast message.
Definition at line 745 of file ckcheckpoint.C.
Referenced by _handlePhase2(), _invokeQD(), ampiInit(), TraceSummaryBOC::askSummary(), HierarchicalLB::avg_load_reduction(), ArmciVirtualProcessor::barrier(), PVT::beginCheckpoint(), pathHistoryManager::broadcastCriticalPathProjections(), ccd_heap_update(), ccsHandlerToCallback(), CentralLB::CheckForRealloc(), ArmciVirtualProcessor::checkpoint(), CkExtContributeToArray(), CkExtContributeToChare(), CkExtContributeToGroup(), KMeansBOC::collectDistances(), KMeansBOC::collectKMeansData(), TraceUtilizationBOC::collectSumDetailData(), TraceSummaryBOC::collectSummaryData(), serialCollideClient::collisions(), CkSparseContiguousReducer< T >::contribute(), CkMulticastMgr::contribute(), MetaBalancer::ContributeStats(), CUDACallbackManager(), CkMemCheckPT::doItNow(), TCharm::done(), DistributedLB::DoneWithLBPhase(), KMeansBOC::findInitialClusters(), MetaBalancerRedn::getMaxIter(), controlPointManager::gotoNextPhase(), SearchConductor::groupInitComplete(), CkCallback::impl_thread_init(), CkMemCheckPT::isMaster(), DistributedLB::LoadReduction(), LV3D0_qd(), LBDB::Migrated(), HybridBaseLB::MigrationDone(), CentralLB::MigrationDone(), PythonObject::print(), DistBaseLB::ProcessAtSync(), CentralLB::ProcessAtSync(), PUPmarshall(), CentralLB::ReceiveCounts(), registerArrayElemJoinExtCallback(), registerArrayElemLeaveExtCallback(), registerArrayMapProcNumExtCallback(), registerArrayMsgRecvExtCallback(), registerArrayResumeFromSyncExtCallback(), registerChareMsgRecvExtCallback(), registerCkRegisterMainModuleCallback(), registerCreateReductionTargetMsgExtCallback(), registerGroupMsgRecvExtCallback(), registerMainchareCtorExtCallback(), registerPyReductionExtCallback(), registerReadOnlyRecvExtCallback(), PythonObject::replyIntValue(), ArmciVirtualProcessor::requestAddresses(), GreedyRefineLB::sendSolution(), sim::SeqBeginCheckpoint(), PVT::setGVT(), TraceSummaryBOC::shrink(), ArmciVirtualProcessor::startCheckpoint(), TraceProjectionsBOC::startEndTimeAnalysis(), 
KMeansBOC::startKMeansAnalysis(), TraceProjectionsBOC::startTimeAnalysis(), DistributedLB::Strategy(), MSA_PageArray< ENTRY_TYPE, ENTRY_OPS_CLASS, ENTRIES_PER_PAGE >::Sync(), TraceSummaryBOC::traceSummaryParallelShutdown(), MetaBalancer::TriggerAdaptiveReduction(), KMeansBOC::updateSeedMembership(), pathHistoryManager::useCriticalPathForPriories(), CentralLB::WillIbekilled(), and GreedyRefineLB::work().