PerfTimer.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491
  1. #include "PerfTimer.h"
  2. #include "BFApp.h"
  3. #pragma warning(disable:4996)
  4. #ifdef _DEBUG
  5. #define PERF_WANTS_THREAD_CHECK
  6. #endif
  7. USING_NS_BF;
  8. PerfManager* Beefy::gPerfManager = NULL;
  9. PerfEntry::PerfEntry()
  10. {
  11. mCount = 0;
  12. mTimeTotal = 0;
  13. mCurTimingStart = 0;
  14. mChild = NULL;
  15. }
  16. void PerfEntry::DbgPrint(const StringImpl& name, int level, std::map<String, int>& uniqueTimingMap)
  17. {
  18. String text;
  19. uint64 childrenTime = 0;
  20. /*PerfEntryMap::iterator itr = mChildren.begin();
  21. while (itr != mChildren.end())
  22. {
  23. PerfEntry* child = &itr->second;
  24. childrenTime += child->mTimeTotal;
  25. ++itr;
  26. }*/
  27. for (auto& kv : mChildren)
  28. {
  29. PerfEntry* child = kv.mValue;
  30. childrenTime += child->mTimeTotal;
  31. }
  32. for (int i = 0; i <= level; i++)
  33. text += " ";
  34. String prefix = text;
  35. text += name;
  36. while (text.length() < 80)
  37. text += ' ';
  38. int selfTime = (int)(mTimeTotal - childrenTime);
  39. if (uniqueTimingMap.find(name) == uniqueTimingMap.end())
  40. uniqueTimingMap[name] = selfTime;
  41. else
  42. uniqueTimingMap[name] += selfTime;
  43. text += StrFormat("%4d\t%6.1f\t%6.1f\n", mCount, mTimeTotal / 1000.0f, (int) (selfTime) / 1000.0f);
  44. /*for (int i = 0; i < (int) mLog.size(); i++)
  45. {
  46. PerfLogEntry* logEntry = &mLog[i];
  47. text += prefix + StrFormat("@%d: %s\n", logEntry->mTick, logEntry->mString.c_str());
  48. }*/
  49. OutputDebugStrF(text.c_str());
  50. for (auto& kv : mChildren)
  51. {
  52. PerfEntry* child = kv.mValue;
  53. child->DbgPrint(kv.mKey, level + 1, uniqueTimingMap);
  54. }
  55. }
  56. void PerfManager::Clear()
  57. {
  58. mLogEntries.ClearFast();
  59. mAlloc.Clear();
  60. mFrames.clear();
  61. mCurStackIdx = 0;
  62. mOverhead = 0;
  63. }
  64. PerfManager::PerfManager()
  65. {
  66. mRecording = false;
  67. mCurStackIdx = 0;
  68. mOwningThreadId = 0;
  69. mOverhead = 0;
  70. mAlloc.mDisableDebugTracing = true;
  71. }
  72. void PerfManager::NextFrame()
  73. {
  74. if (!mRecording)
  75. return;
  76. BF_ASSERT(mCurStackIdx <= 1);
  77. while (mCurStackIdx > 0)
  78. ZoneEnd(true);
  79. auto logEntryFrameStart = mAlloc.Alloc<PerfLogEntry_FrameStart>();
  80. logEntryFrameStart->mType = PerfLogEntryType_FrameStart;
  81. logEntryFrameStart->mTimingStart = BFGetTickCountMicroFast();
  82. mLogEntries.PushBack(logEntryFrameStart);
  83. mCurStackIdx++;
  84. }
  85. void PerfManager::ZoneStart(const char* name)
  86. {
  87. if (!mRecording)
  88. return;
  89. #ifdef PERF_WANTS_THREAD_CHECK
  90. BF_ASSERT(mOwningThreadId == BfpThread_GetCurrentId());
  91. #endif
  92. uint64 callTimerStart = BFGetTickCountMicroFast();
  93. mCurStackIdx++;
  94. int nameLen = (int)strlen(name);
  95. auto logEntryStart = mAlloc.Alloc<PerfLogEntry_Start>(nameLen + 1);
  96. char* namePtr = (char*)(logEntryStart + 1);
  97. strcpy(namePtr, name);
  98. logEntryStart->mType = PerfLogEntryType_Start;
  99. logEntryStart->mName = namePtr;
  100. mLogEntries.PushBack(logEntryStart);
  101. logEntryStart->mTimingStart = BFGetTickCountMicroFast();;
  102. mOverhead += logEntryStart->mTimingStart - callTimerStart;
  103. /*
  104. if (mCurStackIdx == 0)
  105. GetCurFrame();
  106. PerfEntry* curParent = mCurStack[mCurStackIdx - 1];
  107. PerfEntry* entry = NULL;
  108. if (curParent->mChild != NULL)
  109. {
  110. if (curParent->mChild->mName == name)
  111. entry = curParent->mChild;
  112. }
  113. if (entry == NULL)
  114. {
  115. PerfEntryMap::iterator itr = curParent->mChildren.find(name);
  116. if (itr != curParent->mChildren.end())
  117. {
  118. entry = &itr->second;
  119. }
  120. else
  121. {
  122. itr = curParent->mChildren.insert(PerfEntryMap::value_type(name, PerfEntry())).first;
  123. entry = &itr->second;
  124. entry->mName = name;
  125. }
  126. curParent->mChild = entry;
  127. }
  128. entry->mCount++;
  129. entry->mCurTimingStart = BFGetTickCountMicroFast();
  130. mCurStack[mCurStackIdx++] = entry;
  131. mOverhead += entry->mCurTimingStart - callTimerStart;*/
  132. }
  133. void PerfManager::ZoneEnd(bool allowFrameEnd)
  134. {
  135. if (!mRecording)
  136. return;
  137. if ((mCurStackIdx <= 1) && (!allowFrameEnd))
  138. return;
  139. auto logEntryEnd = mAlloc.Alloc<PerfLogEntry_End>();
  140. logEntryEnd->mType = PerfLogEntryType_End;
  141. logEntryEnd->mTimingEnd = BFGetTickCountMicroFast();
  142. mLogEntries.PushBack(logEntryEnd);
  143. mCurStackIdx--;
  144. /*PerfEntry* entry = mCurStack[mCurStackIdx - 1];
  145. mCurStackIdx--;
  146. entry->mTimeTotal += BFGetTickCountMicroFast() - entry->mCurTimingStart;*/
  147. }
  148. void PerfManager::Message(const StringImpl& theString)
  149. {
  150. if (!mRecording)
  151. return;
  152. //TODO: Implement
  153. /*if (mCurStackIdx == 0)
  154. GetCurFrame();
  155. PerfEntry* entry = mCurStack[mCurStackIdx - 1];
  156. PerfLogEntry logEntry;
  157. logEntry.mTick = BFTickCount();
  158. logEntry.mString = theString;
  159. entry->mLog.push_back(logEntry);*/
  160. }
  161. void PerfManager::StartRecording()
  162. {
  163. #ifdef PERF_WANTS_THREAD_CHECK
  164. mOwningThreadId = BfpThread_GetCurrentId();
  165. #endif
  166. mRecording = true;
  167. Clear();
  168. NextFrame();
  169. }
  170. void PerfManager::StopRecording(bool dbgPrint)
  171. {
  172. if (!mRecording)
  173. return;
  174. #ifdef PERF_WANTS_THREAD_CHECK
  175. BF_ASSERT(mOwningThreadId == ::BfpThread_GetCurrentId());
  176. #endif
  177. mRecording = false;
  178. auto logEntryStopRecording = mAlloc.Alloc<PerfLogEntry_StopRecording>();
  179. logEntryStopRecording->mType = PerfLogEntryType_StopRecording;
  180. logEntryStopRecording->mTimingEnd = BFGetTickCountMicroFast();
  181. mLogEntries.PushBack(logEntryStopRecording);
  182. if (dbgPrint)
  183. DbgPrint();
  184. /*if (mFrames.size() > 0)
  185. {
  186. PerfFrame* frame = &mFrames.back();
  187. frame->mTimeTotal = BFGetTickCountMicroFast() - frame->mCurTimingStart;
  188. }*/
  189. }
  190. bool PerfManager::IsRecording()
  191. {
  192. return mRecording;
  193. }
  194. void PerfManager::DbgPrint()
  195. {
  196. #ifdef PERF_WANTS_THREAD_CHECK
  197. BF_ASSERT(mOwningThreadId == ::BfpThread_GetCurrentId());
  198. #endif
  199. if (mFrames.empty())
  200. {
  201. mCurStackIdx = 0;
  202. PerfFrame* curFrame = NULL;
  203. for (auto logEntry : mLogEntries)
  204. {
  205. if (logEntry->mType == PerfLogEntryType_FrameStart)
  206. {
  207. PerfLogEntry_FrameStart* frameStartEntry = (PerfLogEntry_FrameStart*)logEntry;
  208. if (mFrames.size() > 0)
  209. {
  210. PerfFrame* frame = &mFrames.back();
  211. frame->mTimeTotal = frameStartEntry->mTimingStart - frame->mCurTimingStart;
  212. }
  213. mFrames.push_back(PerfFrame());
  214. PerfFrame* frame = &mFrames.back();
  215. frame->mCurTimingStart = frameStartEntry->mTimingStart;
  216. #ifndef BF_NO_BFAPP
  217. if (gBFApp != NULL)
  218. frame->mAppFrameNum = gBFApp->mUpdateCnt;
  219. else
  220. frame->mAppFrameNum = 0;
  221. #else
  222. frame->mAppFrameNum = 0;
  223. #endif
  224. frame->mCount = 1;
  225. mCurStack[mCurStackIdx++] = frame;
  226. }
  227. else if (logEntry->mType == PerfLogEntryType_Start)
  228. {
  229. PerfLogEntry_Start* entryStart = (PerfLogEntry_Start*)logEntry;
  230. PerfEntry* curParent = mCurStack[mCurStackIdx - 1];
  231. PerfEntry* entry = NULL;
  232. if (curParent->mChild != NULL)
  233. {
  234. if (curParent->mChild->mName == entryStart->mName)
  235. entry = curParent->mChild;
  236. }
  237. if (entry == NULL)
  238. {
  239. /*PerfEntryMap::iterator itr = curParent->mChildren.find(entryStart->mName);
  240. if (itr != curParent->mChildren.end())
  241. {
  242. entry = &itr->second;
  243. }
  244. else
  245. {
  246. itr = curParent->mChildren.insert(PerfEntryMap::value_type(entryStart->mName, PerfEntry())).first;
  247. entry = &itr->second;
  248. entry->mName = entryStart->mName;
  249. }*/
  250. PerfEntry** entryPtr = NULL;
  251. if (curParent->mChildren.TryAdd(entryStart->mName, NULL, &entryPtr))
  252. {
  253. entry = mAlloc.Alloc<PerfEntry>();
  254. *entryPtr = entry;
  255. entry->mName = entryStart->mName;
  256. }
  257. else
  258. {
  259. entry = *entryPtr;
  260. }
  261. curParent->mChild = entry;
  262. }
  263. entry->mCount++;
  264. entry->mCurTimingStart = entryStart->mTimingStart;
  265. mCurStack[mCurStackIdx++] = entry;
  266. }
  267. else if (logEntry->mType == PerfLogEntryType_End)
  268. {
  269. PerfLogEntry_End* entryEnd = (PerfLogEntry_End*)logEntry;
  270. PerfEntry* entry = mCurStack[mCurStackIdx - 1];
  271. mCurStackIdx--;
  272. entry->mTimeTotal += entryEnd->mTimingEnd - entry->mCurTimingStart;
  273. }
  274. else if (logEntry->mType == PerfLogEntryType_StopRecording)
  275. {
  276. PerfLogEntry_StopRecording* stopRecordingEntry = (PerfLogEntry_StopRecording*)logEntry;
  277. if (mFrames.size() > 0)
  278. {
  279. PerfFrame* frame = &mFrames.back();
  280. frame->mTimeTotal = stopRecordingEntry->mTimingEnd - frame->mCurTimingStart;
  281. }
  282. }
  283. }
  284. }
  285. std::map<String, int> uniqueTimingMap;
  286. OutputDebugStrF("PerfManager_Results____________________________________________________________Calls___MSTotal__MSSelf\n");
  287. PerfFrameList::iterator frameItr = mFrames.begin();
  288. while (frameItr != mFrames.end())
  289. {
  290. PerfFrame* frame = &(*frameItr);
  291. frame->DbgPrint(StrFormat("Frame %d", frame->mAppFrameNum), 0, uniqueTimingMap);
  292. ++frameItr;
  293. }
  294. OutputDebugStr("\nPerfManager_Combined_Results____________________________________________________________________MSSelf\n");
  295. typedef std::multimap<int, String> SortedMap;
  296. SortedMap sortedMap;
  297. for (auto& entry : uniqueTimingMap)
  298. {
  299. sortedMap.insert(SortedMap::value_type(-entry.second, entry.first));
  300. }
  301. for (auto& entry : sortedMap)
  302. {
  303. String text = entry.second;
  304. for (int i = (int)text.length(); i < 96; i++)
  305. text += " ";
  306. text += StrFormat("%6.1f\n", -entry.first / 1000.0f);
  307. OutputDebugStr(text.c_str());
  308. }
  309. {
  310. String text = "PerfTimer Timing Overhead";
  311. for (int i = (int) text.length(); i < 96; i++)
  312. text += " ";
  313. text += StrFormat("%6.1f\n", mOverhead / 1000.0f);
  314. OutputDebugStr(text.c_str());
  315. }
  316. }
  317. AutoPerf::AutoPerf(const char* name, PerfManager* perfManager)
  318. {
  319. if ((perfManager == NULL) || (!perfManager->mRecording))
  320. {
  321. mPerfManager = NULL;
  322. mStartStackIdx = 0;
  323. return;
  324. }
  325. mPerfManager = perfManager;
  326. mPerfManager->ZoneStart(name);
  327. mStartStackIdx = mPerfManager->mCurStackIdx - 1;
  328. }
  329. void AutoPerf::Leave()
  330. {
  331. if (mStartStackIdx <= 0)
  332. return;
  333. BF_ASSERT(mPerfManager->mCurStackIdx <= mStartStackIdx + 1);
  334. if (mPerfManager->mCurStackIdx > mStartStackIdx)
  335. mPerfManager->ZoneEnd();
  336. mStartStackIdx = -1;
  337. }
  338. AutoPerf::~AutoPerf()
  339. {
  340. Leave();
  341. }
  342. //////////////////////////////////////////////////////////////////////////
  343. AutoPerfRecordAndPrint::AutoPerfRecordAndPrint(PerfManager* perfManager)
  344. {
  345. mPerfManager = perfManager;
  346. mDidStart = !perfManager->mRecording;
  347. if (mDidStart)
  348. perfManager->StartRecording();
  349. }
  350. AutoPerfRecordAndPrint::~AutoPerfRecordAndPrint()
  351. {
  352. if (mDidStart)
  353. mPerfManager->StopRecording(true);
  354. }
  355. //////////////////////////////////////////////////////////////////////////
  356. AutoDbgTime::AutoDbgTime(const StringImpl& name)
  357. {
  358. mName = name;
  359. mStartTick = BFTickCount();
  360. }
  361. AutoDbgTime::~AutoDbgTime()
  362. {
  363. int totalTime = BFTickCount() - mStartTick;
  364. OutputDebugStrF("%s: %d\n", mName.c_str(), totalTime);
  365. }
  366. ///
  367. #ifdef BFSYSLIB_DYNAMIC
  368. BF_EXPORT void BF_CALLTYPE PerfTimer_ZoneStart(const char* name)
  369. {
  370. gPerfManager->ZoneStart(name);
  371. }
  372. BF_EXPORT void BF_CALLTYPE PerfTimer_ZoneEnd()
  373. {
  374. gPerfManager->ZoneEnd();
  375. }
  376. BF_EXPORT void BF_CALLTYPE PerfTimer_Message(const char* theString)
  377. {
  378. gPerfManager->Message(theString);
  379. }
  380. BF_EXPORT int BF_CALLTYPE PerfTimer_IsRecording()
  381. {
  382. return gPerfManager->IsRecording() ? 1 : 0;
  383. }
  384. BF_EXPORT void BF_CALLTYPE PerfTimer_StartRecording()
  385. {
  386. gPerfManager->StartRecording();
  387. }
  388. BF_EXPORT void BF_CALLTYPE PerfTimer_StopRecording()
  389. {
  390. gPerfManager->StopRecording();
  391. }
  392. BF_EXPORT void BF_CALLTYPE PerfTimer_DbgPrint()
  393. {
  394. gPerfManager->DbgPrint();
  395. }
  396. #endif