// JobSystemThreadPool.h
// SPDX-FileCopyrightText: 2021 Jorrit Rouwe
// SPDX-License-Identifier: MIT
  3. #pragma once
  4. #include <Jolt/Core/JobSystem.h>
  5. #include <Jolt/Core/FixedSizeFreeList.h>
  6. JPH_SUPPRESS_WARNINGS_STD_BEGIN
  7. #include <thread>
  8. #include <mutex>
  9. #include <condition_variable>
  10. JPH_SUPPRESS_WARNINGS_STD_END
  11. JPH_NAMESPACE_BEGIN
  12. /// Implementation of a JobSystem using a thread pool
  13. ///
  14. /// Note that this is considered an example implementation. It is expected that when you integrate
  15. /// the physics engine into your own project that you'll provide your own implementation of the
  16. /// JobSystem built on top of whatever job system your project uses.
  17. class JobSystemThreadPool final : public JobSystem
  18. {
  19. public:
  20. /// Creates a thread pool.
  21. /// @see JobSystemThreadPool::Init
  22. JobSystemThreadPool(uint inMaxJobs, uint inMaxBarriers, int inNumThreads = -1);
  23. JobSystemThreadPool() = default;
  24. virtual ~JobSystemThreadPool() override;
  25. /// Initialize the thread pool
  26. /// @param inMaxJobs Max number of jobs that can be allocated at any time
  27. /// @param inMaxBarriers Max number of barriers that can be allocated at any time
  28. /// @param inNumThreads Number of threads to start (the number of concurrent jobs is 1 more because the main thread will also run jobs while waiting for a barrier to complete). Use -1 to autodetect the amount of CPU's.
  29. void Init(uint inMaxJobs, uint inMaxBarriers, int inNumThreads = -1);
  30. // See JobSystem
  31. virtual int GetMaxConcurrency() const override { return int(mThreads.size()) + 1; }
  32. virtual JobHandle CreateJob(const char *inName, ColorArg inColor, const JobFunction &inJobFunction, uint32 inNumDependencies = 0) override;
  33. virtual Barrier * CreateBarrier() override;
  34. virtual void DestroyBarrier(Barrier *inBarrier) override;
  35. virtual void WaitForJobs(Barrier *inBarrier) override;
  36. /// Change the max concurrency after initialization
  37. void SetNumThreads(int inNumThreads) { StopThreads(); StartThreads(inNumThreads); }
  38. protected:
  39. // See JobSystem
  40. virtual void QueueJob(Job *inJob) override;
  41. virtual void QueueJobs(Job **inJobs, uint inNumJobs) override;
  42. virtual void FreeJob(Job *inJob) override;
  43. private:
  44. /// When we switch to C++20 we can use counting_semaphore to unify this
  45. class Semaphore
  46. {
  47. public:
  48. /// Constructor
  49. inline Semaphore();
  50. inline ~Semaphore();
  51. /// Release the semaphore, signalling the thread waiting on the barrier that there may be work
  52. inline void Release(uint inNumber = 1);
  53. /// Acquire the semaphore inNumber times
  54. inline void Acquire(uint inNumber = 1);
  55. /// Get the current value of the semaphore
  56. inline int GetValue() const { return mCount; }
  57. private:
  58. #ifdef JPH_PLATFORM_WINDOWS
  59. // On windows we use a semaphore object since it is more efficient than a lock and a condition variable
  60. alignas(JPH_CACHE_LINE_SIZE) atomic<int> mCount { 0 }; ///< We increment mCount for every release, to acquire we decrement the count. If the count is negative we know that we are waiting on the actual semaphore.
  61. void * mSemaphore; ///< The semaphore is an expensive construct so we only acquire/release it if we know that we need to wait/have waiting threads
  62. #else
  63. // Other platforms: Emulate a semaphore using a mutex, condition variable and count
  64. mutex mLock;
  65. condition_variable mWaitVariable;
  66. int mCount = 0;
  67. #endif
  68. };
  69. class BarrierImpl : public Barrier
  70. {
  71. public:
  72. /// Constructor
  73. BarrierImpl();
  74. virtual ~BarrierImpl() override;
  75. // See Barrier
  76. virtual void AddJob(const JobHandle &inJob) override;
  77. virtual void AddJobs(const JobHandle *inHandles, uint inNumHandles) override;
  78. /// Check if there are any jobs in the job barrier
  79. inline bool IsEmpty() const { return mJobReadIndex == mJobWriteIndex; }
  80. /// Wait for all jobs in this job barrier, while waiting, execute jobs that are part of this barrier on the current thread
  81. void Wait();
  82. /// Flag to indicate if a barrier has been handed out
  83. atomic<bool> mInUse { false };
  84. protected:
  85. /// Called by a Job to mark that it is finished
  86. virtual void OnJobFinished(Job *inJob) override;
  87. /// Jobs queue for the barrier
  88. static constexpr uint cMaxJobs = 2048;
  89. static_assert(IsPowerOf2(cMaxJobs)); // We do bit operations and require max jobs to be a power of 2
  90. atomic<Job *> mJobs[cMaxJobs]; ///< List of jobs that are part of this barrier, nullptrs for empty slots
  91. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mJobReadIndex { 0 }; ///< First job that could be valid (modulo cMaxJobs), can be nullptr if other thread is still working on adding the job
  92. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mJobWriteIndex { 0 }; ///< First job that can be written (modulo cMaxJobs)
  93. atomic<int> mNumToAcquire { 0 }; ///< Number of times the semaphore has been released, the barrier should acquire the semaphore this many times (written at the same time as mJobWriteIndex so ok to put in same cache line)
  94. Semaphore mSemaphore; ///< Semaphore used by finishing jobs to signal the barrier that they're done
  95. };
  96. /// Start/stop the worker threads
  97. void StartThreads(int inNumThreads);
  98. void StopThreads();
  99. /// Entry point for a thread
  100. void ThreadMain(const char *inName, int inThreadIndex);
  101. /// Get the head of the thread that has processed the least amount of jobs
  102. inline uint GetHead() const;
  103. /// Internal helper function to queue a job
  104. inline void QueueJobInternal(Job *inJob);
  105. /// Array of jobs (fixed size)
  106. using AvailableJobs = FixedSizeFreeList<Job>;
  107. AvailableJobs mJobs;
  108. /// Array of barriers (we keep them constructed all the time since constructing a semaphore/mutex is not cheap)
  109. uint mMaxBarriers = 0; ///< Max amount of barriers
  110. BarrierImpl * mBarriers = nullptr; ///< List of the actual barriers
  111. /// Threads running jobs
  112. vector<thread> mThreads;
  113. // The job queue
  114. static constexpr uint32 cQueueLength = 1024;
  115. static_assert(IsPowerOf2(cQueueLength)); // We do bit operations and require queue length to be a power of 2
  116. atomic<Job *> mQueue[cQueueLength];
  117. // Head and tail of the queue, do this value modulo cQueueLength - 1 to get the element in the mQueue array
  118. atomic<uint> * mHeads = nullptr; ///< Per executing thread the head of the current queue
  119. alignas(JPH_CACHE_LINE_SIZE) atomic<uint> mTail = 0; ///< Tail (write end) of the queue
  120. // Semaphore used to signal worker threads that there is new work
  121. Semaphore mSemaphore;
  122. /// Boolean to indicate that we want to stop the job system
  123. atomic<bool> mQuit = false;
  124. };
  125. JPH_NAMESPACE_END