BsGpuParams.cpp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449
  1. #include "BsGpuParams.h"
  2. #include "BsGpuParamDesc.h"
  3. #include "BsGpuParamBlock.h"
  4. #include "BsGpuParamBlockBuffer.h"
  5. #include "BsVector2.h"
  6. #include "BsFrameAlloc.h"
  7. #include "BsDebug.h"
  8. #include "BsException.h"
  9. namespace BansheeEngine
  10. {
  11. GpuParamsInternalData::GpuParamsInternalData()
  12. :mTransposeMatrices(false), mData(nullptr), mNumParamBlocks(0), mNumTextures(0), mNumSamplerStates(0), mFrameAlloc(nullptr),
  13. mParamBlocks(nullptr), mParamBlockBuffers(nullptr), mTextures(nullptr), mSamplerStates(nullptr), mCoreDirtyFlags(0xFFFFFFFF),
  14. mIsDestroyed(false), mTextureInfo(nullptr)
  15. { }
  16. GpuParams::GpuParams(const GpuParamDescPtr& paramDesc, bool transposeMatrices)
  17. :mParamDesc(paramDesc)
  18. {
  19. mInternalData = bs_shared_ptr<GpuParamsInternalData>();
  20. mInternalData->mTransposeMatrices = transposeMatrices;
  21. for(auto& paramBlock : mParamDesc->paramBlocks)
  22. {
  23. if ((paramBlock.second.slot + 1) > mInternalData->mNumParamBlocks)
  24. mInternalData->mNumParamBlocks = paramBlock.second.slot + 1;
  25. }
  26. for(auto& texture : mParamDesc->textures)
  27. {
  28. if ((texture.second.slot + 1) > mInternalData->mNumTextures)
  29. mInternalData->mNumTextures = texture.second.slot + 1;
  30. }
  31. for(auto& sampler : mParamDesc->samplers)
  32. {
  33. if ((sampler.second.slot + 1) > mInternalData->mNumSamplerStates)
  34. mInternalData->mNumSamplerStates = sampler.second.slot + 1;
  35. }
  36. constructInternalBuffers();
  37. }
  38. GpuParams::GpuParams(const GpuParamDescPtr& paramDesc, PrivatelyConstruct& dummy)
  39. :mParamDesc(paramDesc)
  40. {
  41. }
  42. GpuParams::~GpuParams()
  43. {
  44. mInternalData->mIsDestroyed = true;
  45. // Ensure everything is destructed
  46. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  47. {
  48. mInternalData->mParamBlocks[i].~shared_ptr();
  49. mInternalData->mParamBlockBuffers[i].~shared_ptr();
  50. }
  51. for (UINT32 i = 0; i < mInternalData->mNumTextures; i++)
  52. mInternalData->mTextures[i].~ResourceHandle();
  53. for (UINT32 i = 0; i < mInternalData->mNumTextures; i++)
  54. mInternalData->mTextureInfo[i].~BoundTextureInfo();
  55. for (UINT32 i = 0; i < mInternalData->mNumSamplerStates; i++)
  56. mInternalData->mSamplerStates[i].~ResourceHandle();
  57. if (mInternalData->mFrameAlloc != nullptr)
  58. mInternalData->mFrameAlloc->dealloc(mInternalData->mData);
  59. else
  60. bs_free(mInternalData->mData);
  61. }
  62. void GpuParams::setParamBlockBuffer(UINT32 slot, const GpuParamBlockBufferPtr& paramBlockBuffer)
  63. {
  64. if (slot < 0 || slot >= mInternalData->mNumParamBlocks)
  65. {
  66. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  67. toString(mInternalData->mNumParamBlocks - 1) + ". Requested: " + toString(slot));
  68. }
  69. mInternalData->mParamBlockBuffers[slot] = paramBlockBuffer;
  70. mInternalData->mParamBlocks[slot] = paramBlockBuffer->getParamBlock();
  71. markCoreDirty();
  72. }
  73. void GpuParams::setParamBlockBuffer(const String& name, const GpuParamBlockBufferPtr& paramBlockBuffer)
  74. {
  75. auto iterFind = mParamDesc->paramBlocks.find(name);
  76. if(iterFind == mParamDesc->paramBlocks.end())
  77. {
  78. LOGWRN("Cannot find parameter block with the name: " + name);
  79. return;
  80. }
  81. mInternalData->mParamBlockBuffers[iterFind->second.slot] = paramBlockBuffer;
  82. mInternalData->mParamBlocks[iterFind->second.slot] = paramBlockBuffer != nullptr ? paramBlockBuffer->getParamBlock() : nullptr;
  83. markCoreDirty();
  84. }
  85. UINT32 GpuParams::getDataParamSize(const String& name) const
  86. {
  87. GpuParamDataDesc* desc = getParamDesc(name);
  88. if(desc != nullptr)
  89. return desc->elementSize * 4;
  90. return 0;
  91. }
  92. bool GpuParams::hasParam(const String& name) const
  93. {
  94. return getParamDesc(name) != nullptr;
  95. }
  96. bool GpuParams::hasTexture(const String& name) const
  97. {
  98. auto paramIter = mParamDesc->textures.find(name);
  99. if(paramIter != mParamDesc->textures.end())
  100. return true;
  101. return false;
  102. }
  103. bool GpuParams::hasSamplerState(const String& name) const
  104. {
  105. auto paramIter = mParamDesc->samplers.find(name);
  106. if(paramIter != mParamDesc->samplers.end())
  107. return true;
  108. return false;
  109. }
  110. bool GpuParams::hasParamBlock(const String& name) const
  111. {
  112. auto paramBlockIter = mParamDesc->paramBlocks.find(name);
  113. if(paramBlockIter != mParamDesc->paramBlocks.end())
  114. return true;
  115. return false;
  116. }
  117. void GpuParams::getStructParam(const String& name, GpuParamStruct& output) const
  118. {
  119. auto iterFind = mParamDesc->params.find(name);
  120. if (iterFind == mParamDesc->params.end() || iterFind->second.type != GPDT_STRUCT)
  121. BS_EXCEPT(InvalidParametersException, "Cannot find struct parameter with the name '" + name + "'");
  122. output = GpuParamStruct(&iterFind->second, mInternalData);
  123. }
  124. void GpuParams::getTextureParam(const String& name, GpuParamTexture& output) const
  125. {
  126. auto iterFind = mParamDesc->textures.find(name);
  127. if (iterFind == mParamDesc->textures.end())
  128. BS_EXCEPT(InvalidParametersException, "Cannot find texture parameter with the name '" + name + "'");
  129. output = GpuParamTexture(&iterFind->second, mInternalData);
  130. }
  131. void GpuParams::getLoadStoreTextureParam(const String& name, GpuParamLoadStoreTexture& output) const
  132. {
  133. auto iterFind = mParamDesc->textures.find(name);
  134. if (iterFind == mParamDesc->textures.end())
  135. BS_EXCEPT(InvalidParametersException, "Cannot find texture parameter with the name '" + name + "'");
  136. output = GpuParamLoadStoreTexture(&iterFind->second, mInternalData);
  137. }
  138. void GpuParams::getSamplerStateParam(const String& name, GpuParamSampState& output) const
  139. {
  140. auto iterFind = mParamDesc->samplers.find(name);
  141. if (iterFind == mParamDesc->samplers.end())
  142. BS_EXCEPT(InvalidParametersException, "Cannot find sampler state parameter with the name '" + name + "'");
  143. output = GpuParamSampState(&iterFind->second, mInternalData);
  144. }
  145. GpuParamDataDesc* GpuParams::getParamDesc(const String& name) const
  146. {
  147. auto paramIter = mParamDesc->params.find(name);
  148. if(paramIter != mParamDesc->params.end())
  149. return &paramIter->second;
  150. return nullptr;
  151. }
  152. GpuParamBlockBufferPtr GpuParams::getParamBlockBuffer(UINT32 slot) const
  153. {
  154. if (slot < 0 || slot >= mInternalData->mNumParamBlocks)
  155. {
  156. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  157. toString(mInternalData->mNumParamBlocks - 1) + ". Requested: " + toString(slot));
  158. }
  159. return mInternalData->mParamBlockBuffers[slot];
  160. }
  161. HTexture GpuParams::getTexture(UINT32 slot)
  162. {
  163. if (slot < 0 || slot >= mInternalData->mNumTextures)
  164. {
  165. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  166. toString(mInternalData->mNumTextures - 1) + ". Requested: " + toString(slot));
  167. }
  168. return mInternalData->mTextures[slot];
  169. }
  170. HSamplerState GpuParams::getSamplerState(UINT32 slot)
  171. {
  172. if (slot < 0 || slot >= mInternalData->mNumSamplerStates)
  173. {
  174. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  175. toString(mInternalData->mNumSamplerStates - 1) + ". Requested: " + toString(slot));
  176. }
  177. return mInternalData->mSamplerStates[slot];
  178. }
  179. bool GpuParams::isLoadStoreTexture(UINT32 slot) const
  180. {
  181. if (slot < 0 || slot >= mInternalData->mNumTextures)
  182. {
  183. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  184. toString(mInternalData->mNumTextures - 1) + ". Requested: " + toString(slot));
  185. }
  186. return mInternalData->mTextureInfo[slot].isLoadStore;
  187. }
  188. const TextureSurface& GpuParams::getLoadStoreSurface(UINT32 slot) const
  189. {
  190. if (slot < 0 || slot >= mInternalData->mNumTextures)
  191. {
  192. BS_EXCEPT(InvalidParametersException, "Index out of range: Valid range: 0 .. " +
  193. toString(mInternalData->mNumTextures - 1) + ". Requested: " + toString(slot));
  194. }
  195. return mInternalData->mTextureInfo[slot].surface;
  196. }
  197. void GpuParams::updateHardwareBuffers()
  198. {
  199. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  200. {
  201. if (mInternalData->mParamBlocks[i] != nullptr && mInternalData->mParamBlockBuffers[i] != nullptr)
  202. {
  203. if (mInternalData->mParamBlocks[i]->isDirty())
  204. mInternalData->mParamBlocks[i]->uploadToBuffer(mInternalData->mParamBlockBuffers[i]);
  205. }
  206. }
  207. }
  208. void GpuParams::_updateFromCopy(const GpuParamsPtr& copy)
  209. {
  210. assert(copy->mInternalData->mNumParamBlocks == mInternalData->mNumParamBlocks);
  211. assert(copy->mInternalData->mNumTextures == mInternalData->mNumTextures);
  212. assert(copy->mInternalData->mNumSamplerStates == mInternalData->mNumSamplerStates);
  213. for (UINT32 i = 0; i < mInternalData->mNumTextures; i++)
  214. {
  215. mInternalData->mTextures[i] = copy->mInternalData->mTextures[i];
  216. mInternalData->mTextureInfo[i] = copy->mInternalData->mTextureInfo[i];
  217. }
  218. for (UINT32 i = 0; i < mInternalData->mNumSamplerStates; i++)
  219. {
  220. mInternalData->mSamplerStates[i] = copy->mInternalData->mSamplerStates[i];
  221. }
  222. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  223. {
  224. GpuParamBlockPtr destParamBlock = mInternalData->mParamBlocks[i];
  225. GpuParamBlockPtr srcParamBlock = copy->mInternalData->mParamBlocks[i];
  226. if (destParamBlock != nullptr && srcParamBlock != nullptr)
  227. {
  228. destParamBlock->write(0, srcParamBlock->getData(), srcParamBlock->getSize());
  229. }
  230. }
  231. }
  232. GpuParamsPtr GpuParams::_clone(FrameAlloc* frameAlloc, bool onlyDirtyBlocks) const
  233. {
  234. GpuParamsPtr myClone = nullptr;
  235. if (frameAlloc != nullptr)
  236. {
  237. StdFrameAlloc<std::shared_ptr<GpuParams>> myAlloc(frameAlloc);
  238. myClone = std::allocate_shared<GpuParams>(myAlloc, mParamDesc, PrivatelyConstruct());
  239. myClone->mInternalData = std::allocate_shared<GpuParamsInternalData>(myAlloc);
  240. }
  241. else
  242. {
  243. myClone = bs_shared_ptr<GpuParams>(mParamDesc, PrivatelyConstruct());;
  244. myClone->mInternalData = bs_shared_ptr<GpuParamsInternalData>();
  245. }
  246. myClone->mInternalData->mIsDestroyed = mInternalData->mIsDestroyed;
  247. myClone->mInternalData->mTransposeMatrices = mInternalData->mTransposeMatrices;
  248. myClone->mInternalData->mNumParamBlocks = mInternalData->mNumParamBlocks;
  249. myClone->mInternalData->mNumTextures = mInternalData->mNumTextures;
  250. myClone->mInternalData->mNumSamplerStates = mInternalData->mNumSamplerStates;
  251. myClone->constructInternalBuffers(frameAlloc);
  252. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  253. {
  254. GpuParamBlockBufferPtr buffer = mInternalData->mParamBlockBuffers[i];
  255. if (buffer != nullptr && (!onlyDirtyBlocks || buffer->getParamBlock()->isDirty()))
  256. {
  257. GpuParamBlockPtr newBlock = nullptr;
  258. if (frameAlloc != nullptr)
  259. {
  260. StdFrameAlloc<GpuParams> myAlloc(frameAlloc);
  261. newBlock = std::allocate_shared<GpuParamBlock>(myAlloc, frameAlloc, buffer->getSize());
  262. }
  263. else
  264. {
  265. newBlock = bs_shared_ptr<GpuParamBlock>(buffer->getSize());;
  266. }
  267. newBlock->write(0, buffer->getParamBlock()->getData(), buffer->getSize());
  268. myClone->mInternalData->mParamBlocks[i] = newBlock;
  269. }
  270. else
  271. myClone->mInternalData->mParamBlocks[i] = nullptr;
  272. myClone->mInternalData->mParamBlockBuffers[i] = buffer;
  273. }
  274. for (UINT32 i = 0; i < mInternalData->mNumTextures; i++)
  275. {
  276. myClone->mInternalData->mTextures[i] = mInternalData->mTextures[i];
  277. myClone->mInternalData->mTextureInfo[i] = mInternalData->mTextureInfo[i];
  278. }
  279. for (UINT32 i = 0; i < mInternalData->mNumSamplerStates; i++)
  280. {
  281. myClone->mInternalData->mSamplerStates[i] = mInternalData->mSamplerStates[i];
  282. }
  283. return myClone;
  284. }
  285. void GpuParams::constructInternalBuffers(FrameAlloc* frameAlloc)
  286. {
  287. // Allocate everything in a single block of memory to get rid of extra memory allocations
  288. UINT32 bufferSize = 0;
  289. UINT32 paramBlockOffset = 0;
  290. UINT32 paramBlockBufferOffset = 0;
  291. UINT32 textureOffset = 0;
  292. UINT32 samplerStateOffset = 0;
  293. UINT32 textureInfoOffset = 0;
  294. UINT32 paramBlockBufferSize = mInternalData->mNumParamBlocks * sizeof(GpuParamBlockPtr);
  295. UINT32 paramBlockBuffersBufferSize = mInternalData->mNumParamBlocks * sizeof(GpuParamBlockBufferPtr);
  296. UINT32 textureBufferSize = mInternalData->mNumTextures * sizeof(HTexture);
  297. UINT32 textureInfoBufferSize = mInternalData->mNumTextures * sizeof(BoundTextureInfo);
  298. UINT32 samplerStateBufferSize = mInternalData->mNumSamplerStates * sizeof(HSamplerState);
  299. bufferSize = paramBlockBufferSize + paramBlockBuffersBufferSize + textureBufferSize + samplerStateBufferSize + textureInfoBufferSize;
  300. paramBlockOffset = 0;
  301. paramBlockBufferOffset = paramBlockOffset + paramBlockBufferSize;
  302. textureOffset = paramBlockBufferOffset + paramBlockBuffersBufferSize;
  303. samplerStateOffset = textureOffset + textureBufferSize;
  304. textureInfoOffset = samplerStateOffset + samplerStateBufferSize;
  305. if (frameAlloc != nullptr)
  306. {
  307. mInternalData->mData = frameAlloc->alloc(bufferSize);
  308. mInternalData->mFrameAlloc = frameAlloc;
  309. }
  310. else
  311. {
  312. mInternalData->mData = (UINT8*)bs_alloc(bufferSize);
  313. mInternalData->mFrameAlloc = nullptr;
  314. }
  315. mInternalData->mParamBlocks = (GpuParamBlockPtr*)(mInternalData->mData + paramBlockOffset);
  316. mInternalData->mParamBlockBuffers = (GpuParamBlockBufferPtr*)(mInternalData->mData + paramBlockBufferOffset);
  317. mInternalData->mTextures = (HTexture*)(mInternalData->mData + textureOffset);
  318. mInternalData->mSamplerStates = (HSamplerState*)(mInternalData->mData + samplerStateOffset);
  319. mInternalData->mTextureInfo = (BoundTextureInfo*)(mInternalData->mData + textureInfoOffset);
  320. // Ensure everything is constructed
  321. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  322. {
  323. {
  324. GpuParamBlockPtr* ptrToIdx = (&mInternalData->mParamBlocks[i]);
  325. ptrToIdx = new (&mInternalData->mParamBlocks[i]) GpuParamBlockPtr(nullptr);
  326. }
  327. {
  328. GpuParamBlockBufferPtr* ptrToIdx = (&mInternalData->mParamBlockBuffers[i]);
  329. ptrToIdx = new (&mInternalData->mParamBlockBuffers[i]) GpuParamBlockBufferPtr(nullptr);
  330. }
  331. }
  332. for (UINT32 i = 0; i < mInternalData->mNumTextures; i++)
  333. {
  334. {
  335. HTexture* ptrToIdx = (&mInternalData->mTextures[i]);
  336. ptrToIdx = new (&mInternalData->mTextures[i]) HTexture();
  337. }
  338. {
  339. BoundTextureInfo* ptrToIdx = (&mInternalData->mTextureInfo[i]);
  340. ptrToIdx = new (&mInternalData->mTextureInfo[i]) BoundTextureInfo();
  341. }
  342. }
  343. for (UINT32 i = 0; i < mInternalData->mNumSamplerStates; i++)
  344. {
  345. HSamplerState* ptrToIdx = (&mInternalData->mSamplerStates[i]);
  346. ptrToIdx = new (&mInternalData->mSamplerStates[i]) HSamplerState();
  347. }
  348. }
  349. bool GpuParams::_isCoreDirty() const
  350. {
  351. return mInternalData->mCoreDirtyFlags != 0;
  352. }
  353. void GpuParams::_markCoreClean()
  354. {
  355. mInternalData->mCoreDirtyFlags = 0;
  356. for (UINT32 i = 0; i < mInternalData->mNumParamBlocks; i++)
  357. {
  358. if (mInternalData->mParamBlocks[i] != nullptr)
  359. mInternalData->mParamBlocks[i]->setDirty(false);
  360. }
  361. }
  362. void GpuParams::markCoreDirty()
  363. {
  364. mInternalData->mCoreDirtyFlags = 0xFFFFFFFF;
  365. }
  366. }