virtualStack.cpp 7.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188
  1. // zlib open source license
  2. //
  3. // Copyright (c) 2024 David Forsgren Piuva
  4. //
  5. // This software is provided 'as-is', without any express or implied
  6. // warranty. In no event will the authors be held liable for any damages
  7. // arising from the use of this software.
  8. //
  9. // Permission is granted to anyone to use this software for any purpose,
  10. // including commercial applications, and to alter it and redistribute it
  11. // freely, subject to the following restrictions:
  12. //
  13. // 1. The origin of this software must not be misrepresented; you must not
  14. // claim that you wrote the original software. If you use this software
  15. // in a product, an acknowledgment in the product documentation would be
  16. // appreciated but is not required.
  17. //
  18. // 2. Altered source versions must be plainly marked as such, and must not be
  19. // misrepresented as being the original software.
  20. //
  21. // 3. This notice may not be removed or altered from any source
  22. // distribution.
  23. #include "virtualStack.h"
  24. #include <thread>
  25. #include "../api/stringAPI.h"
  26. namespace dsr {
  27. // How many bytes that are allocated directly in thread local memory.
  28. static const uint64_t VIRTUAL_STACK_SIZE = 262144;
  29. static const int MAX_EXTRA_STACKS = 63;
  30. static const uintptr_t stackHeaderPaddedSize = memory_getPaddedSize<AllocationHeader>();
  31. static const uintptr_t stackHeaderAlignmentAndMask = memory_createAlignmentAndMask((uintptr_t)alignof(AllocationHeader));
  // Bookkeeping shared by every stack region.
  // A region spans the addresses from top to bottom and is filled from bottom towards top.
  struct StackMemory {
    // Lowest address of the region. The stack pointer is here when completely full.
    uint8_t *top{nullptr};
    // The virtual stack pointer, marking the start of the most recent allocation.
    uint8_t *stackPointer{nullptr};
    // End of the region. The stack pointer is here when empty.
    uint8_t *bottom{nullptr};
  };
  37. // The first block of stack memory in stread local memory.
  38. struct FixedStackMemory : public StackMemory {
  39. uint8_t data[VIRTUAL_STACK_SIZE];
  40. FixedStackMemory() {
  41. this->top = this->data;
  42. this->stackPointer = this->data + VIRTUAL_STACK_SIZE;
  43. this->bottom = this->data + VIRTUAL_STACK_SIZE;
  44. }
  45. };
  46. // Additional stacks in heap memory.
  47. struct DynamicStackMemory : public StackMemory {
  48. ~DynamicStackMemory() {
  49. if (this->top != nullptr) {
  50. free(this->top);
  51. }
  52. }
  53. };
  // Reserves memory by moving pointer towards lower addresses.
  //   pointer is stepped down by paddedSize bytes and the resulting address is then masked with alignmentAndMask.
  // Returns the number of bytes between the new and the old address, which is the size of the allocation including alignment.
  inline uint64_t increaseStackPointer(uint8_t *&pointer, uint64_t paddedSize, uintptr_t alignmentAndMask) {
    const uintptr_t addressBefore = reinterpret_cast<uintptr_t>(pointer);
    // Masking can only clear bits, so the aligned address is never above the unaligned one.
    const uintptr_t addressAfter = (addressBefore - paddedSize) & alignmentAndMask;
    pointer = reinterpret_cast<uint8_t*>(addressAfter);
    return addressBefore - addressAfter;
  }
  // Releases memory by moving pointer totalSize bytes towards higher addresses.
  // totalSize is the whole distance to step back, covering both the data and its alignment.
  inline void decreaseStackPointer(uint8_t *&pointer, uint64_t totalSize) {
    pointer = pointer + totalSize;
  }
  66. static uint8_t *stackAllocate(StackMemory& stack, uint64_t paddedSize, uintptr_t alignmentAndMask) {
  67. uint8_t *newStackPointer = stack.stackPointer;
  68. // Allocate memory for payload.
  69. uint64_t payloadTotalSize = increaseStackPointer(newStackPointer, paddedSize, alignmentAndMask);
  70. // Get a pointer to the payload.
  71. uint8_t *result = newStackPointer;
  72. // Allocate memory for header.
  73. uint64_t headerTotalSize = increaseStackPointer(newStackPointer, stackHeaderPaddedSize, stackHeaderAlignmentAndMask);
  74. // Check that we did not run out of memory.
  75. if (newStackPointer < stack.top) {
  76. // Not enough space.
  77. return nullptr;
  78. } else {
  79. stack.stackPointer = newStackPointer;
  80. // Write the header to memory.
  81. *((AllocationHeader*)stack.stackPointer) = AllocationHeader(payloadTotalSize + headerTotalSize, true);
  82. // Clear the new allocation for determinism.
  83. std::memset((void*)result, 0, payloadTotalSize);
  84. // Return a pointer to the payload.
  85. return result;
  86. }
  87. }
  88. thread_local FixedStackMemory fixedMemory; // Index -1
  89. thread_local DynamicStackMemory dynamicMemory[MAX_EXTRA_STACKS]; // Index 0..MAX_EXTRA_STACKS-1
  90. thread_local int32_t stackIndex = -1;
  91. uint8_t *virtualStack_push(uint64_t paddedSize, uintptr_t alignmentAndMask) {
  92. if (stackIndex < 0) {
  93. uint8_t *result = stackAllocate(fixedMemory, paddedSize, alignmentAndMask);
  94. // Check that we did not run out of memory.
  95. if (result == nullptr) {
  96. // Not enough space in thread local memory. Moving to the first dynamic stack.
  97. stackIndex = 0;
  98. goto allocateDynamic;
  99. } else {
  100. // Return a pointer to the payload.
  101. return result;
  102. }
  103. }
  104. allocateDynamic:
  105. // We should only reach this place if allocating in dynamic stack memory.
  106. assert(stackIndex >= 0);
  107. // Never go above the maximum index.
  108. assert(stackIndex < MAX_EXTRA_STACKS);
  109. // Allocate memory in the dynamic stack if not yet allocated.
  110. if (dynamicMemory[stackIndex].top == nullptr) {
  111. uint64_t regionSize = 16777216 * (1 << stackIndex);
  112. if (paddedSize * 4 > regionSize) {
  113. regionSize = paddedSize * 4;
  114. }
  115. uint8_t *newMemory = (uint8_t*)malloc(regionSize);
  116. if (newMemory == nullptr) {
  117. throwError(U"Failed to allocate ", regionSize, U" bytes of heap memory for expanding the virtual stack when trying to allocate ", paddedSize, " bytes!\n");
  118. return nullptr;
  119. } else {
  120. // Keep the new allocation.
  121. dynamicMemory[stackIndex].top = newMemory;
  122. // Start from the back of the new allocation.
  123. dynamicMemory[stackIndex].stackPointer = newMemory + regionSize;
  124. dynamicMemory[stackIndex].bottom = newMemory + regionSize;
  125. }
  126. }
  127. assert(dynamicMemory[stackIndex].stackPointer != nullptr);
  128. // Allocate memory.
  129. uint8_t *result = stackAllocate(dynamicMemory[stackIndex], paddedSize, alignmentAndMask);
  130. if (result == nullptr) {
  131. if (stackIndex >= MAX_EXTRA_STACKS - 1) {
  132. throwError(U"Exceeded MAX_EXTRA_STACKS to allocate more heap memory for a thread local virtual stack!\n");
  133. return nullptr;
  134. } else {
  135. stackIndex++;
  136. goto allocateDynamic;
  137. }
  138. } else {
  139. // Return a pointer to the payload.
  140. return result;
  141. }
  142. }
  143. // Deallocates the topmost allocation in the stack or returns false if it does not contain any more allocations.
  144. static bool stackDeallocate(StackMemory& stack) {
  145. if (stack.stackPointer + stackHeaderPaddedSize > stack.bottom) {
  146. // If the allocated memory does not fit a header, then it is empty.
  147. return false;
  148. } else {
  149. // Read the header.
  150. AllocationHeader header = *((AllocationHeader*)stack.stackPointer);
  151. // Overwrite the header.
  152. *((AllocationHeader*)stack.stackPointer) = AllocationHeader();
  153. // Deallocate both header and payload using the stored total size.
  154. decreaseStackPointer(stack.stackPointer, header.totalSize);
  155. return true;
  156. }
  157. }
  158. void virtualStack_pop() {
  159. if (stackIndex < 0) {
  160. if (!stackDeallocate(fixedMemory)) {
  161. throwError(U"No more stack memory to pop!\n");
  162. }
  163. } else {
  164. if (!stackDeallocate(dynamicMemory[stackIndex])) {
  165. throwError(U"The virtual stack has been corrupted!\n");
  166. } else {
  167. // If the bottom has been reached then go to the lower stack.
  168. if (dynamicMemory[stackIndex].stackPointer >= dynamicMemory[stackIndex].bottom) {
  169. stackIndex--;
  170. }
  171. }
  172. }
  173. }
  174. }