JobSystemThreadPool.h 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153
  1. // SPDX-FileCopyrightText: 2021 Jorrit Rouwe
  2. // SPDX-License-Identifier: MIT
  3. #pragma once
  4. #include <Jolt/Core/JobSystem.h>
  5. #include <Jolt/Core/FixedSizeFreeList.h>
  6. JPH_SUPPRESS_WARNINGS_STD_BEGIN
  7. #include <thread>
  8. #include <mutex>
  9. #include <condition_variable>
  10. JPH_SUPPRESS_WARNINGS_STD_END
  11. JPH_NAMESPACE_BEGIN
  12. /// Implementation of a JobSystem using a thread pool
  13. ///
  14. /// Note that this is considered an example implementation. It is expected that when you integrate
  15. /// the physics engine into your own project that you'll provide your own implementation of the
  16. /// JobSystem built on top of whatever job system your project uses.
      ///
      /// Overview of the state declared below: jobs are allocated from a fixed size free list (mJobs),
      /// queued jobs are stored in a fixed length array of atomic job pointers (mQueue, cQueueLength entries),
      /// each executing thread has its own head into that queue (mHeads) and worker threads are signalled
      /// through a semaphore (mSemaphore) when there is new work.
  17. class JobSystemThreadPool final : public JobSystem
  18. {
  19. public:
  20. /// Creates a thread pool.
  21. /// @param inMaxJobs Max number of jobs that can be allocated at any time
  22. /// @param inMaxBarriers Max number of barriers that can be allocated at any time
  23. /// @param inNumThreads Number of threads to start (the number of concurrent jobs is 1 more because the main thread will also run jobs while waiting for a barrier to complete). Use -1 to autodetect the number of CPUs.
  24. JobSystemThreadPool(uint inMaxJobs, uint inMaxBarriers, int inNumThreads = -1);
  25. virtual ~JobSystemThreadPool() override;
  26. // See JobSystem
      // GetMaxConcurrency reports the number of worker threads plus one, because the thread that waits on a barrier also runs jobs.
  27. virtual int GetMaxConcurrency() const override { return int(mThreads.size()) + 1; }
  28. virtual JobHandle CreateJob(const char *inName, ColorArg inColor, const JobFunction &inJobFunction, uint32 inNumDependencies = 0) override;
  29. virtual Barrier * CreateBarrier() override;
  30. virtual void DestroyBarrier(Barrier *inBarrier) override;
  31. virtual void WaitForJobs(Barrier *inBarrier) override;
  32. /// Change the max concurrency after initialization.
      /// Calls StopThreads() followed by StartThreads(inNumThreads).
      /// NOTE(review): presumably this must not be called while jobs are queued or running - confirm against StopThreads().
      /// @param inNumThreads Number of threads to start, forwarded unchanged to StartThreads
  33. void SetNumThreads(int inNumThreads) { StopThreads(); StartThreads(inNumThreads); }
  34. protected:
  35. // See JobSystem
  36. virtual void QueueJob(Job *inJob) override;
  37. virtual void QueueJobs(Job **inJobs, uint inNumJobs) override;
  38. virtual void FreeJob(Job *inJob) override;
  39. private:
  40. /// Counting semaphore with a platform specific implementation (see the #ifdef below).
      /// When we switch to C++20 we can use counting_semaphore to unify this
  41. class Semaphore
  42. {
  43. public:
  44. /// Constructor / destructor (defined out of line)
  45. inline Semaphore();
  46. inline ~Semaphore();
  47. /// Release the semaphore, signalling the thread waiting on the barrier that there may be work
      /// @param inNumber Number of times to release
  48. inline void Release(uint inNumber = 1);
  49. /// Acquire the semaphore inNumber times
  50. inline void Acquire(uint inNumber = 1);
  51. /// Get the current value of the semaphore (returns mCount as is).
      /// NOTE(review): on non-Windows platforms mCount is a plain int and this read does not take mLock,
      /// so the result should be treated as a snapshot only - confirm that callers tolerate this.
  52. inline int GetValue() const { return mCount; }
  53. private:
  54. #ifdef JPH_PLATFORM_WINDOWS
  55. // On windows we use a semaphore object since it is more efficient than a lock and a condition variable
  56. alignas(JPH_CACHE_LINE_SIZE) atomic<int> mCount { 0 }; ///< We increment mCount for every release, to acquire we decrement the count. If the count is negative we know that we are waiting on the actual semaphore.
  57. void * mSemaphore; ///< The semaphore is an expensive construct so we only acquire/release it if we know that we need to wait/have waiting threads. Has no default initializer here, presumably set by the constructor - confirm.
  58. #else
  59. // Other platforms: Emulate a semaphore using a mutex, condition variable and count
  60. mutex mLock;
  61. condition_variable mWaitVariable;
  62. int mCount = 0;
  63. #endif
  64. };
      /// Barrier implementation that keeps its jobs in a fixed size array of cMaxJobs slots,
      /// addressed through a read and a write index (both taken modulo cMaxJobs).
  65. class BarrierImpl : public Barrier
  66. {
  67. public:
  68. /// Constructor
  69. BarrierImpl();
  70. virtual ~BarrierImpl() override;
  71. // See Barrier
  72. virtual void AddJob(const JobHandle &inJob) override;
  73. virtual void AddJobs(const JobHandle *inHandles, uint inNumHandles) override;
  74. /// Check if there are any jobs in the job barrier (true when the read index equals the write index)
  75. inline bool IsEmpty() const { return mJobReadIndex == mJobWriteIndex; }
  76. /// Wait for all jobs in this job barrier, while waiting, execute jobs that are part of this barrier on the current thread
  77. void Wait();
  78. /// Flag to indicate if a barrier has been handed out
  79. atomic<bool> mInUse { false };
  80. protected:
  81. /// Called by a Job to mark that it is finished
  82. virtual void OnJobFinished(Job *inJob) override;
  83. /// Jobs queue for the barrier
  84. static constexpr uint cMaxJobs = 1024;
  85. static_assert(IsPowerOf2(cMaxJobs)); // We do bit operations and require max jobs to be a power of 2
  86. atomic<Job *> mJobs[cMaxJobs]; ///< List of jobs that are part of this barrier, nullptrs for empty slots
  87. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mJobReadIndex { 0 }; ///< First job that could be valid (modulo cMaxJobs), can be nullptr if other thread is still working on adding the job
  88. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mJobWriteIndex { 0 }; ///< First job that can be written (modulo cMaxJobs)
  89. atomic<int> mNumToAcquire { 0 }; ///< Number of times the semaphore has been released, the barrier should acquire the semaphore this many times (written at the same time as mJobWriteIndex so ok to put in same cache line)
  90. Semaphore mSemaphore; ///< Semaphore used by finishing jobs to signal the barrier that they're done
  91. };
  92. /// Start/stop the worker threads
      /// NOTE(review): the constructor documents -1 as "autodetect"; presumably StartThreads resolves that value - confirm.
  93. void StartThreads(int inNumThreads);
  94. void StopThreads();
  95. /// Entry point for a thread
      /// @param inName Name for the thread
      /// @param inThreadIndex Index of the thread (presumably the index of this thread's entry in mHeads - confirm)
  96. void ThreadMain(const char *inName, int inThreadIndex);
  97. /// Get the head of the thread that has processed the fewest jobs
  98. inline uint GetHead() const;
  99. /// Internal helper function to queue a job
  100. inline void QueueJobInternal(Job *inJob);
  101. /// Array of jobs (fixed size)
  102. using AvailableJobs = FixedSizeFreeList<Job>;
  103. AvailableJobs mJobs;
  104. /// Array of barriers (we keep them constructed all the time since constructing a semaphore/mutex is not cheap)
       /// NOTE(review): mBarriers is a raw pointer; presumably an array of mMaxBarriers elements owned by this class - confirm.
  105. uint mMaxBarriers; ///< Max amount of barriers
  106. BarrierImpl * mBarriers; ///< List of the actual barriers
  107. /// Threads running jobs
  108. vector<thread> mThreads;
  109. // The job queue
  110. static constexpr uint32 cQueueLength = 1024;
  111. static_assert(IsPowerOf2(cQueueLength)); // We do bit operations and require queue length to be a power of 2
  112. atomic<Job *> mQueue[cQueueLength];
  113. // Head and tail of the queue, take the value modulo cQueueLength (equivalently: bitwise AND with cQueueLength - 1, which is why cQueueLength must be a power of 2) to get the element in the mQueue array
  114. atomic<uint> * mHeads = nullptr; ///< Per executing thread the head of the current queue
  115. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mTail = 0; ///< Tail (write end) of the queue
  116. // Semaphore used to signal worker threads that there is new work
  117. Semaphore mSemaphore;
  118. /// Boolean to indicate that we want to stop the job system
  119. atomic<bool> mQuit = false;
  120. };
  121. JPH_NAMESPACE_END