circular_buffer_benchmark.cc 3.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138
  1. // Copyright The OpenTelemetry Authors
  2. // SPDX-License-Identifier: Apache-2.0
  3. #include <stddef.h>
  4. #include <atomic>
  5. #include <cstdint>
  6. #include <exception>
  7. #include <functional>
  8. #include <iostream>
  9. #include <memory>
  10. #include <random>
  11. #include <thread>
  12. #include <vector>
  13. #include "benchmark/benchmark.h"
  14. #include "opentelemetry/sdk/common/atomic_unique_ptr.h"
  15. #include "opentelemetry/sdk/common/circular_buffer.h"
  16. #include "opentelemetry/sdk/common/circular_buffer_range.h"
  17. #include "test/common/baseline_circular_buffer.h"
  18. using opentelemetry::sdk::common::AtomicUniquePtr;
  19. using opentelemetry::sdk::common::CircularBuffer;
  20. using opentelemetry::sdk::common::CircularBufferRange;
  21. using opentelemetry::testing::BaselineCircularBuffer;
  22. const int N = 10000;
  23. static uint64_t ConsumeBufferNumbers(BaselineCircularBuffer<uint64_t> &buffer) noexcept
  24. {
  25. uint64_t result = 0;
  26. buffer.Consume([&](std::unique_ptr<uint64_t> &&x) {
  27. result += *x;
  28. x.reset();
  29. });
  30. return result;
  31. }
  32. static uint64_t ConsumeBufferNumbers(CircularBuffer<uint64_t> &buffer) noexcept
  33. {
  34. uint64_t result = 0;
  35. buffer.Consume(buffer.size(),
  36. [&](CircularBufferRange<AtomicUniquePtr<uint64_t>> &range) noexcept {
  37. range.ForEach([&](AtomicUniquePtr<uint64_t> &ptr) noexcept {
  38. result += *ptr;
  39. ptr.Reset();
  40. return true;
  41. });
  42. });
  43. return result;
  44. }
  45. template <class Buffer>
  46. static void GenerateNumbersForThread(Buffer &buffer, int n, std::atomic<uint64_t> &sum) noexcept
  47. {
  48. thread_local std::mt19937_64 random_number_generator{std::random_device{}()};
  49. for (int i = 0; i < n; ++i)
  50. {
  51. auto x = random_number_generator();
  52. std::unique_ptr<uint64_t> element{new uint64_t{x}};
  53. if (buffer.Add(element))
  54. {
  55. sum += x;
  56. }
  57. }
  58. }
  59. template <class Buffer>
  60. static uint64_t GenerateNumbers(Buffer &buffer, int num_threads, int n) noexcept
  61. {
  62. std::atomic<uint64_t> sum{0};
  63. std::vector<std::thread> threads(num_threads);
  64. for (auto &thread : threads)
  65. {
  66. thread = std::thread{GenerateNumbersForThread<Buffer>, std::ref(buffer), n, std::ref(sum)};
  67. }
  68. for (auto &thread : threads)
  69. {
  70. thread.join();
  71. }
  72. return sum;
  73. }
  74. template <class Buffer>
  75. static void ConsumeNumbers(Buffer &buffer, uint64_t &sum, std::atomic<bool> &finished) noexcept
  76. {
  77. while (!finished)
  78. {
  79. sum += ConsumeBufferNumbers(buffer);
  80. }
  81. sum += ConsumeBufferNumbers(buffer);
  82. }
  83. template <class Buffer>
  84. static void RunSimulation(Buffer &buffer, int num_threads, int n) noexcept
  85. {
  86. std::atomic<bool> finished{false};
  87. uint64_t consumer_sum{0};
  88. std::thread consumer_thread{ConsumeNumbers<Buffer>, std::ref(buffer), std::ref(consumer_sum),
  89. std::ref(finished)};
  90. uint64_t producer_sum = GenerateNumbers(buffer, num_threads, n);
  91. finished = true;
  92. consumer_thread.join();
  93. if (consumer_sum != producer_sum)
  94. {
  95. std::cerr << "Sumulation failed: consumer_sum != producer_sum\n";
  96. std::terminate();
  97. }
  98. }
  99. static void BM_BaselineBuffer(benchmark::State &state)
  100. {
  101. const size_t max_elements = 500;
  102. const int num_threads = static_cast<int>(state.range(0));
  103. const int n = static_cast<int>(N / num_threads);
  104. BaselineCircularBuffer<uint64_t> buffer{max_elements};
  105. for (auto _ : state)
  106. {
  107. RunSimulation(buffer, num_threads, n);
  108. }
  109. }
  110. BENCHMARK(BM_BaselineBuffer)->Arg(1)->Arg(2)->Arg(4);
  111. static void BM_LockFreeBuffer(benchmark::State &state)
  112. {
  113. const size_t max_elements = 500;
  114. const int num_threads = static_cast<int>(state.range(0));
  115. const int n = static_cast<int>(N / num_threads);
  116. CircularBuffer<uint64_t> buffer{max_elements};
  117. for (auto _ : state)
  118. {
  119. RunSimulation(buffer, num_threads, n);
  120. }
  121. }
  122. BENCHMARK(BM_LockFreeBuffer)->Arg(1)->Arg(2)->Arg(4);
  123. BENCHMARK_MAIN();