// PerformanceTest.cpp
  1. // SPDX-FileCopyrightText: 2021 Jorrit Rouwe
  2. // SPDX-License-Identifier: MIT
  3. // Jolt includes
  4. #include <Jolt/Jolt.h>
  5. #include <Jolt/RegisterTypes.h>
  6. #include <Jolt/Core/Factory.h>
  7. #include <Jolt/Core/TempAllocator.h>
  8. #include <Jolt/Core/JobSystemThreadPool.h>
  9. #include <Jolt/Physics/PhysicsSettings.h>
  10. #include <Jolt/Physics/PhysicsSystem.h>
  11. #include <Jolt/Physics/Collision/NarrowPhaseStats.h>
  12. #include <Jolt/Physics/StateRecorderImpl.h>
  13. #ifdef JPH_DEBUG_RENDERER
  14. #include <Jolt/Renderer/DebugRendererRecorder.h>
  15. #include <Jolt/Core/StreamWrapper.h>
  16. #endif // JPH_DEBUG_RENDERER
  17. // STL includes
  18. #include <iostream>
  19. #include <thread>
  20. #include <chrono>
  21. #include <memory>
  22. #include <cstdarg>
  23. using namespace JPH;
  24. using namespace std;
  25. // Disable common warnings triggered by Jolt
  26. JPH_SUPPRESS_WARNINGS
  27. // Local includes
  28. #include "RagdollScene.h"
  29. #include "ConvexVsMeshScene.h"
  30. // Time step for physics
  31. constexpr float cDeltaTime = 1.0f / 60.0f;
  32. static void TraceImpl(const char *inFMT, ...)
  33. {
  34. // Format the message
  35. va_list list;
  36. va_start(list, inFMT);
  37. char buffer[1024];
  38. vsnprintf(buffer, sizeof(buffer), inFMT, list);
  39. // Print to the TTY
  40. cout << buffer << endl;
  41. }
  42. // Program entry point
  43. int main(int argc, char** argv)
  44. {
  45. // Register allocation hook
  46. RegisterDefaultAllocator();
  47. // Parse command line parameters
  48. int specified_quality = -1;
  49. int specified_threads = -1;
  50. uint max_iterations = 500;
  51. bool disable_sleep = false;
  52. bool enable_profiler = false;
  53. #ifdef JPH_DEBUG_RENDERER
  54. bool enable_debug_renderer = false;
  55. #endif // JPH_DEBUG_RENDERER
  56. bool enable_per_frame_recording = false;
  57. bool record_state = false;
  58. bool validate_state = false;
  59. unique_ptr<PerformanceTestScene> scene;
  60. for (int argidx = 1; argidx < argc; ++argidx)
  61. {
  62. const char *arg = argv[argidx];
  63. if (strncmp(arg, "-s=", 3) == 0)
  64. {
  65. // Parse scene
  66. if (strcmp(arg + 3, "Ragdoll") == 0)
  67. scene = unique_ptr<PerformanceTestScene>(new RagdollScene);
  68. else if (strcmp(arg + 3, "ConvexVsMesh") == 0)
  69. scene = unique_ptr<PerformanceTestScene>(new ConvexVsMeshScene);
  70. else
  71. {
  72. cerr << "Invalid scene" << endl;
  73. return 1;
  74. }
  75. }
  76. else if (strncmp(arg, "-i=", 3) == 0)
  77. {
  78. // Parse max iterations
  79. max_iterations = (uint)atoi(arg + 3);
  80. }
  81. else if (strncmp(arg, "-q=", 3) == 0)
  82. {
  83. // Parse quality
  84. if (strcmp(arg + 3, "Discrete") == 0)
  85. specified_quality = 0;
  86. else if (strcmp(arg + 3, "LinearCast") == 0)
  87. specified_quality = 1;
  88. else
  89. {
  90. cerr << "Invalid quality" << endl;
  91. return 1;
  92. }
  93. }
  94. else if (strncmp(arg, "-t=", 3) == 0)
  95. {
  96. // Parse threads
  97. specified_threads = atoi(arg + 3);
  98. }
  99. else if (strcmp(arg, "-no_sleep") == 0)
  100. {
  101. disable_sleep = true;
  102. }
  103. else if (strcmp(arg, "-p") == 0)
  104. {
  105. enable_profiler = true;
  106. }
  107. #ifdef JPH_DEBUG_RENDERER
  108. else if (strcmp(arg, "-r") == 0)
  109. {
  110. enable_debug_renderer = true;
  111. }
  112. #endif // JPH_DEBUG_RENDERER
  113. else if (strcmp(arg, "-f") == 0)
  114. {
  115. enable_per_frame_recording = true;
  116. }
  117. else if (strcmp(arg, "-rs") == 0)
  118. {
  119. record_state = true;
  120. }
  121. else if (strcmp(arg, "-vs") == 0)
  122. {
  123. validate_state = true;
  124. }
  125. else if (strcmp(arg, "-h") == 0)
  126. {
  127. // Print usage
  128. cerr << "Usage:" << endl
  129. << "-s=<scene>: Select scene (Ragdoll, ConvexVsMesh)" << endl
  130. << "-i=<num physics steps>: Number of physics steps to simulate (default 500)" << endl
  131. << "-q=<quality>: Test only with specified quality (Discrete, LinearCast)" << endl
  132. << "-t=<num threads>: Test only with N threads (default is to iterate over 1 .. num hardware threads)" << endl
  133. << "-p: Write out profiles" << endl
  134. << "-r: Record debug renderer output for JoltViewer" << endl
  135. << "-f: Record per frame timings" << endl
  136. << "-no_sleep: Disable sleeping" << endl
  137. << "-rs: Record state" << endl
  138. << "-vs: Validate state" << endl;
  139. return 0;
  140. }
  141. }
  142. // Install callbacks
  143. Trace = TraceImpl;
  144. // Create a factory
  145. Factory::sInstance = new Factory();
  146. // Register all Jolt physics types
  147. RegisterTypes();
  148. // Create temp allocator
  149. TempAllocatorImpl temp_allocator(10 * 1024 * 1024);
  150. // Load the scene
  151. if (scene == nullptr)
  152. scene = unique_ptr<PerformanceTestScene>(new RagdollScene);
  153. if (!scene->Load())
  154. return 1;
  155. // Output scene we're running
  156. cout << "Running scene: " << scene->GetName() << endl;
  157. // Create mapping table from object layer to broadphase layer
  158. BPLayerInterfaceImpl broad_phase_layer_interface;
  159. // Start profiling this program
  160. JPH_PROFILE_START("Main");
  161. // Trace header
  162. cout << "Motion Quality, Thread Count, Steps / Second, Hash" << endl;
  163. // Iterate motion qualities
  164. for (uint mq = 0; mq < 2; ++mq)
  165. {
  166. // Skip quality if another was specified
  167. if (specified_quality != -1 && mq != (uint)specified_quality)
  168. continue;
  169. // Determine motion quality
  170. EMotionQuality motion_quality = mq == 0? EMotionQuality::Discrete : EMotionQuality::LinearCast;
  171. String motion_quality_str = mq == 0? "Discrete" : "LinearCast";
  172. // Determine which thread counts to test
  173. Array<uint> thread_permutations;
  174. if (specified_threads > 0)
  175. thread_permutations.push_back((uint)specified_threads - 1);
  176. else
  177. for (uint num_threads = 0; num_threads < thread::hardware_concurrency(); ++num_threads)
  178. thread_permutations.push_back(num_threads);
  179. // Test thread permutations
  180. for (uint num_threads : thread_permutations)
  181. {
  182. // Create job system with desired number of threads
  183. JobSystemThreadPool job_system(cMaxPhysicsJobs, cMaxPhysicsBarriers, num_threads);
  184. // Create physics system
  185. PhysicsSystem physics_system;
  186. physics_system.Init(10240, 0, 65536, 10240, broad_phase_layer_interface, BroadPhaseCanCollide, ObjectCanCollide);
  187. // Start test scene
  188. scene->StartTest(physics_system, motion_quality);
  189. // Disable sleeping if requested
  190. if (disable_sleep)
  191. {
  192. const BodyLockInterface &bli = physics_system.GetBodyLockInterfaceNoLock();
  193. BodyIDVector body_ids;
  194. physics_system.GetBodies(body_ids);
  195. for (BodyID id : body_ids)
  196. {
  197. BodyLockWrite lock(bli, id);
  198. if (lock.Succeeded())
  199. {
  200. Body &body = lock.GetBody();
  201. if (!body.IsStatic())
  202. body.SetAllowSleeping(false);
  203. }
  204. }
  205. }
  206. // Optimize the broadphase to prevent an expensive first frame
  207. physics_system.OptimizeBroadPhase();
  208. // A tag used to identify the test
  209. String tag = ToLower(motion_quality_str) + "_th" + ConvertToString(num_threads + 1);
  210. #ifdef JPH_DEBUG_RENDERER
  211. // Open renderer output
  212. ofstream renderer_file;
  213. if (enable_debug_renderer)
  214. renderer_file.open(("performance_test_" + tag + ".jor").c_str(), ofstream::out | ofstream::binary | ofstream::trunc);
  215. StreamOutWrapper renderer_stream(renderer_file);
  216. DebugRendererRecorder renderer(renderer_stream);
  217. #endif // JPH_DEBUG_RENDERER
  218. // Open per frame timing output
  219. ofstream per_frame_file;
  220. if (enable_per_frame_recording)
  221. {
  222. per_frame_file.open(("per_frame_" + tag + ".csv").c_str(), ofstream::out | ofstream::trunc);
  223. per_frame_file << "Frame, Time (ms)" << endl;
  224. }
  225. ofstream record_state_file;
  226. ifstream validate_state_file;
  227. if (record_state)
  228. record_state_file.open(("state_" + ToLower(motion_quality_str) + ".bin").c_str(), ofstream::out | ofstream::binary | ofstream::trunc);
  229. else if (validate_state)
  230. validate_state_file.open(("state_" + ToLower(motion_quality_str) + ".bin").c_str(), ifstream::in | ifstream::binary);
  231. chrono::nanoseconds total_duration(0);
  232. // Step the world for a fixed amount of iterations
  233. for (uint iterations = 0; iterations < max_iterations; ++iterations)
  234. {
  235. JPH_PROFILE_NEXTFRAME();
  236. // Start measuring
  237. chrono::high_resolution_clock::time_point clock_start = chrono::high_resolution_clock::now();
  238. // Do a physics step
  239. physics_system.Update(cDeltaTime, 1, 1, &temp_allocator, &job_system);
  240. // Stop measuring
  241. chrono::high_resolution_clock::time_point clock_end = chrono::high_resolution_clock::now();
  242. chrono::nanoseconds duration = chrono::duration_cast<chrono::nanoseconds>(clock_end - clock_start);
  243. total_duration += duration;
  244. #ifdef JPH_DEBUG_RENDERER
  245. if (enable_debug_renderer)
  246. {
  247. // Draw the state of the world
  248. BodyManager::DrawSettings settings;
  249. physics_system.DrawBodies(settings, &renderer);
  250. // Mark end of frame
  251. renderer.EndFrame();
  252. }
  253. #endif // JPH_DEBUG_RENDERER
  254. // Record time taken this iteration
  255. if (enable_per_frame_recording)
  256. per_frame_file << iterations << ", " << (1.0e-6 * duration.count()) << endl;
  257. // Dump profile information every 100 iterations
  258. if (enable_profiler && iterations % 100 == 0)
  259. {
  260. JPH_PROFILE_DUMP(tag + "_it" + ConvertToString(iterations));
  261. }
  262. if (record_state)
  263. {
  264. // Record state
  265. StateRecorderImpl recorder;
  266. physics_system.SaveState(recorder);
  267. // Write to file
  268. string data = recorder.GetData();
  269. size_t size = data.size();
  270. record_state_file.write((char *)&size, sizeof(size));
  271. record_state_file.write(data.data(), size);
  272. }
  273. else if (validate_state)
  274. {
  275. // Read state
  276. size_t size = 0;
  277. validate_state_file.read((char *)&size, sizeof(size));
  278. string data;
  279. data.resize(size);
  280. validate_state_file.read(data.data(), size);
  281. // Copy to validator
  282. StateRecorderImpl validator;
  283. validator.WriteBytes(data.data(), size);
  284. // Validate state
  285. validator.SetValidating(true);
  286. physics_system.RestoreState(validator);
  287. }
  288. }
  289. // Calculate hash of all positions and rotations of the bodies
  290. uint64 hash = HashBytes(nullptr, 0); // Ensure we start with the proper seed
  291. BodyInterface &bi = physics_system.GetBodyInterfaceNoLock();
  292. BodyIDVector body_ids;
  293. physics_system.GetBodies(body_ids);
  294. for (BodyID id : body_ids)
  295. {
  296. Vec3 pos = bi.GetPosition(id);
  297. hash = HashBytes(&pos, 3 * sizeof(float), hash);
  298. Quat rot = bi.GetRotation(id);
  299. hash = HashBytes(&rot, sizeof(Quat), hash);
  300. }
  301. // Stop test scene
  302. scene->StopTest(physics_system);
  303. // Trace stat line
  304. cout << motion_quality_str << ", " << num_threads + 1 << ", " << double(max_iterations) / (1.0e-9 * total_duration.count()) << ", 0x" << hex << hash << dec << endl;
  305. }
  306. }
  307. #ifdef JPH_TRACK_NARROWPHASE_STATS
  308. NarrowPhaseStat::sReportStats();
  309. #endif // JPH_TRACK_NARROWPHASE_STATS
  310. // Destroy the factory
  311. delete Factory::sInstance;
  312. Factory::sInstance = nullptr;
  313. // End profiling this program
  314. JPH_PROFILE_END();
  315. return 0;
  316. }