RtShadows.cpp 28 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723
  1. // Copyright (C) 2009-2023, Panagiotis Christopoulos Charitos and contributors.
  2. // All rights reserved.
  3. // Code licensed under the BSD License.
  4. // http://www.anki3d.org/LICENSE
  5. #include <AnKi/Renderer/RtShadows.h>
  6. #include <AnKi/Renderer/GBuffer.h>
  7. #include <AnKi/Renderer/Renderer.h>
  8. #include <AnKi/Renderer/ShadowMapping.h>
  9. #include <AnKi/Renderer/AccelerationStructureBuilder.h>
  10. #include <AnKi/Renderer/MotionVectors.h>
  11. #include <AnKi/Renderer/DepthDownscale.h>
  12. #include <AnKi/Renderer/RenderQueue.h>
  13. #include <AnKi/Renderer/ClusterBinning.h>
  14. #include <AnKi/Renderer/PackVisibleClusteredObjects.h>
  15. #include <AnKi/Util/Tracer.h>
  16. #include <AnKi/Core/CVarSet.h>
  17. #include <AnKi/Shaders/Include/MaterialTypes.h>
  18. #include <AnKi/Shaders/Include/GpuSceneTypes.h>
  19. #include <AnKi/Core/GpuMemory/UnifiedGeometryBuffer.h>
  20. #include <AnKi/Core/GpuMemory/GpuSceneBuffer.h>
  21. namespace anki {
  22. static BoolCVar g_rtShadowsSvgfCVar(CVarSubsystem::kRenderer, "RtShadowsSvgf", false, "Enable or not RT shadows SVGF");
  23. static NumericCVar<U8> g_rtShadowsSvgfAtrousPassCountCVar(CVarSubsystem::kRenderer, "RtShadowsSvgfAtrousPassCount", 3, 1, 20,
  24. "Number of atrous passes of SVGF");
  25. static NumericCVar<U32> g_rtShadowsRaysPerPixelCVar(CVarSubsystem::kRenderer, "RtShadowsRaysPerPixel", 1, 1, 8, "Number of shadow rays per pixel");
  26. Error RtShadows::init()
  27. {
  28. const Error err = initInternal();
  29. if(err)
  30. {
  31. ANKI_R_LOGE("Failed to initialize ray traced shadows");
  32. }
  33. return err;
  34. }
  35. Error RtShadows::initInternal()
  36. {
  37. ANKI_R_LOGV("Initializing RT shadows");
  38. m_useSvgf = g_rtShadowsSvgfCVar.get();
  39. m_atrousPassCount = g_rtShadowsSvgfAtrousPassCountCVar.get();
  40. ANKI_CHECK(ResourceManager::getSingleton().loadResource("EngineAssets/BlueNoise_Rgba8_64x64.png", m_blueNoiseImage));
  41. // Ray gen program
  42. {
  43. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsRayGen.ankiprogbin", m_rayGenProg));
  44. ShaderProgramResourceVariantInitInfo variantInitInfo(m_rayGenProg);
  45. variantInitInfo.addMutation("RAYS_PER_PIXEL", g_rtShadowsRaysPerPixelCVar.get());
  46. const ShaderProgramResourceVariant* variant;
  47. m_rayGenProg->getOrCreateVariant(variantInitInfo, variant);
  48. m_rtLibraryGrProg.reset(&variant->getProgram());
  49. m_rayGenShaderGroupIdx = variant->getShaderGroupHandleIndex();
  50. }
  51. // Miss prog
  52. {
  53. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsMiss.ankiprogbin", m_missProg));
  54. const ShaderProgramResourceVariant* variant;
  55. m_missProg->getOrCreateVariant(variant);
  56. m_missShaderGroupIdx = variant->getShaderGroupHandleIndex();
  57. }
  58. // Denoise program
  59. if(!m_useSvgf)
  60. {
  61. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsDenoise.ankiprogbin", m_denoiseProg));
  62. ShaderProgramResourceVariantInitInfo variantInitInfo(m_denoiseProg);
  63. variantInitInfo.addConstant("kOutImageSize",
  64. UVec2(getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2));
  65. variantInitInfo.addConstant("kMinSampleCount", 8u);
  66. variantInitInfo.addConstant("kMaxSampleCount", 32u);
  67. variantInitInfo.addMutation("BLUR_ORIENTATION", 0);
  68. const ShaderProgramResourceVariant* variant;
  69. m_denoiseProg->getOrCreateVariant(variantInitInfo, variant);
  70. m_grDenoiseHorizontalProg.reset(&variant->getProgram());
  71. variantInitInfo.addMutation("BLUR_ORIENTATION", 1);
  72. m_denoiseProg->getOrCreateVariant(variantInitInfo, variant);
  73. m_grDenoiseVerticalProg.reset(&variant->getProgram());
  74. }
  75. // SVGF variance program
  76. if(m_useSvgf)
  77. {
  78. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsSvgfVariance.ankiprogbin", m_svgfVarianceProg));
  79. ShaderProgramResourceVariantInitInfo variantInitInfo(m_svgfVarianceProg);
  80. variantInitInfo.addConstant("kFramebufferSize",
  81. UVec2(getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2));
  82. const ShaderProgramResourceVariant* variant;
  83. m_svgfVarianceProg->getOrCreateVariant(variantInitInfo, variant);
  84. m_svgfVarianceGrProg.reset(&variant->getProgram());
  85. }
  86. // SVGF atrous program
  87. if(m_useSvgf)
  88. {
  89. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsSvgfAtrous.ankiprogbin", m_svgfAtrousProg));
  90. ShaderProgramResourceVariantInitInfo variantInitInfo(m_svgfAtrousProg);
  91. variantInitInfo.addConstant("kFramebufferSize",
  92. UVec2(getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2));
  93. variantInitInfo.addMutation("LAST_PASS", 0);
  94. const ShaderProgramResourceVariant* variant;
  95. m_svgfAtrousProg->getOrCreateVariant(variantInitInfo, variant);
  96. m_svgfAtrousGrProg.reset(&variant->getProgram());
  97. variantInitInfo.addMutation("LAST_PASS", 1);
  98. m_svgfAtrousProg->getOrCreateVariant(variantInitInfo, variant);
  99. m_svgfAtrousLastPassGrProg.reset(&variant->getProgram());
  100. }
  101. // Upscale program
  102. {
  103. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsUpscale.ankiprogbin", m_upscaleProg));
  104. ShaderProgramResourceVariantInitInfo variantInitInfo(m_upscaleProg);
  105. variantInitInfo.addConstant("kOutImageSize", UVec2(getRenderer().getInternalResolution().x(), getRenderer().getInternalResolution().y()));
  106. const ShaderProgramResourceVariant* variant;
  107. m_upscaleProg->getOrCreateVariant(variantInitInfo, variant);
  108. m_upscaleGrProg.reset(&variant->getProgram());
  109. }
  110. // Debug program
  111. ANKI_CHECK(
  112. ResourceManager::getSingleton().loadResource("ShaderBinaries/RtShadowsVisualizeRenderTarget.ankiprogbin", m_visualizeRenderTargetsProg));
  113. // Quarter rez shadow RT
  114. {
  115. TextureInitInfo texinit = getRenderer().create2DRenderTargetInitInfo(
  116. getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2, Format::kR32G32_Uint,
  117. TextureUsageBit::kAllSampled | TextureUsageBit::kImageTraceRaysWrite | TextureUsageBit::kImageComputeWrite, "RtShadows History");
  118. m_historyRt = getRenderer().createAndClearRenderTarget(texinit, TextureUsageBit::kSampledFragment);
  119. }
  120. // Temp shadow RT
  121. {
  122. m_intermediateShadowsRtDescr = getRenderer().create2DRenderTargetDescription(
  123. getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2, Format::kR32G32_Uint, "RtShadows Tmp");
  124. m_intermediateShadowsRtDescr.bake();
  125. }
  126. // Moments RT
  127. {
  128. TextureInitInfo texinit = getRenderer().create2DRenderTargetInitInfo(
  129. getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2, Format::kR32G32_Sfloat,
  130. TextureUsageBit::kAllSampled | TextureUsageBit::kImageTraceRaysWrite | TextureUsageBit::kImageComputeWrite, "RtShadows Moments #1");
  131. m_momentsRts[0] = getRenderer().createAndClearRenderTarget(texinit, TextureUsageBit::kSampledFragment);
  132. texinit.setName("RtShadows Moments #2");
  133. m_momentsRts[1] = getRenderer().createAndClearRenderTarget(texinit, TextureUsageBit::kSampledFragment);
  134. }
  135. // Variance RT
  136. if(m_useSvgf)
  137. {
  138. m_varianceRtDescr = getRenderer().create2DRenderTargetDescription(
  139. getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2, Format::kR32_Sfloat, "RtShadows Variance");
  140. m_varianceRtDescr.bake();
  141. }
  142. // Final RT
  143. {
  144. m_upscaledRtDescr = getRenderer().create2DRenderTargetDescription(
  145. getRenderer().getInternalResolution().x(), getRenderer().getInternalResolution().y(), Format::kR32G32_Uint, "RtShadows Upscaled");
  146. m_upscaledRtDescr.bake();
  147. }
  148. // Misc
  149. m_sbtRecordSize = getAlignedRoundUp(GrManager::getSingleton().getDeviceCapabilities().m_sbtRecordAlignment, m_sbtRecordSize);
  150. return Error::kNone;
  151. }
  152. void RtShadows::populateRenderGraph(RenderingContext& ctx)
  153. {
  154. ANKI_TRACE_SCOPED_EVENT(RRtShadows);
  155. RenderGraphDescription& rgraph = ctx.m_renderGraphDescr;
  156. buildSbt(ctx);
  157. const U32 prevRtIdx = getRenderer().getFrameCount() & 1;
  158. // Import RTs
  159. {
  160. if(!m_rtsImportedOnce) [[unlikely]]
  161. {
  162. m_runCtx.m_historyRt = rgraph.importRenderTarget(m_historyRt.get(), TextureUsageBit::kSampledFragment);
  163. m_runCtx.m_prevMomentsRt = rgraph.importRenderTarget(m_momentsRts[prevRtIdx].get(), TextureUsageBit::kSampledFragment);
  164. m_rtsImportedOnce = true;
  165. }
  166. else
  167. {
  168. m_runCtx.m_historyRt = rgraph.importRenderTarget(m_historyRt.get());
  169. m_runCtx.m_prevMomentsRt = rgraph.importRenderTarget(m_momentsRts[prevRtIdx].get());
  170. }
  171. if((getPassCountWithoutUpscaling() % 2) == 1)
  172. {
  173. m_runCtx.m_intermediateShadowsRts[0] = rgraph.newRenderTarget(m_intermediateShadowsRtDescr);
  174. m_runCtx.m_intermediateShadowsRts[1] = rgraph.newRenderTarget(m_intermediateShadowsRtDescr);
  175. }
  176. else
  177. {
  178. // We can save a render target if we have even number of renderpasses
  179. m_runCtx.m_intermediateShadowsRts[0] = rgraph.newRenderTarget(m_intermediateShadowsRtDescr);
  180. m_runCtx.m_intermediateShadowsRts[1] = m_runCtx.m_historyRt;
  181. }
  182. m_runCtx.m_currentMomentsRt = rgraph.importRenderTarget(m_momentsRts[!prevRtIdx].get(), TextureUsageBit::kNone);
  183. if(m_useSvgf)
  184. {
  185. if(m_atrousPassCount > 1)
  186. {
  187. m_runCtx.m_varianceRts[0] = rgraph.newRenderTarget(m_varianceRtDescr);
  188. }
  189. m_runCtx.m_varianceRts[1] = rgraph.newRenderTarget(m_varianceRtDescr);
  190. }
  191. m_runCtx.m_upscaledRt = rgraph.newRenderTarget(m_upscaledRtDescr);
  192. }
  193. #define ANKI_DEPTH_DEP \
  194. getRenderer().getDepthDownscale().getHiZRt(), TextureUsageBit::kSampledTraceRays | TextureUsageBit::kSampledCompute, kHiZHalfSurface
  195. // RT shadows pass
  196. {
  197. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows");
  198. rpass.setWork([this](RenderPassWorkContext& rgraphCtx) {
  199. run(rgraphCtx);
  200. });
  201. rpass.newTextureDependency(m_runCtx.m_historyRt, TextureUsageBit::kSampledTraceRays);
  202. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[0], TextureUsageBit::kImageTraceRaysWrite);
  203. rpass.newAccelerationStructureDependency(getRenderer().getAccelerationStructureBuilder().getAccelerationStructureHandle(),
  204. AccelerationStructureUsageBit::kTraceRaysRead);
  205. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  206. rpass.newTextureDependency(getRenderer().getMotionVectors().getMotionVectorsRt(), TextureUsageBit::kSampledTraceRays);
  207. rpass.newTextureDependency(getRenderer().getMotionVectors().getHistoryLengthRt(), TextureUsageBit::kSampledTraceRays);
  208. rpass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSampledTraceRays);
  209. rpass.newTextureDependency(m_runCtx.m_prevMomentsRt, TextureUsageBit::kSampledTraceRays);
  210. rpass.newTextureDependency(m_runCtx.m_currentMomentsRt, TextureUsageBit::kImageTraceRaysWrite);
  211. rpass.newBufferDependency(getRenderer().getClusterBinning().getClustersRenderGraphHandle(), BufferUsageBit::kStorageTraceRaysRead);
  212. }
  213. // Denoise pass horizontal
  214. if(!m_useSvgf)
  215. {
  216. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows Denoise Horizontal");
  217. rpass.setWork([this, &ctx](RenderPassWorkContext& rgraphCtx) {
  218. runDenoise(ctx, rgraphCtx);
  219. });
  220. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[0], TextureUsageBit::kSampledCompute);
  221. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  222. rpass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSampledCompute);
  223. rpass.newTextureDependency(m_runCtx.m_currentMomentsRt, TextureUsageBit::kSampledCompute);
  224. rpass.newTextureDependency(getRenderer().getMotionVectors().getHistoryLengthRt(), TextureUsageBit::kSampledCompute);
  225. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[1], TextureUsageBit::kImageComputeWrite);
  226. }
  227. // Denoise pass vertical
  228. if(!m_useSvgf)
  229. {
  230. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows Denoise Vertical");
  231. rpass.setWork([this, &ctx](RenderPassWorkContext& rgraphCtx) {
  232. runDenoise(ctx, rgraphCtx);
  233. });
  234. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[1], TextureUsageBit::kSampledCompute);
  235. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  236. rpass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSampledCompute);
  237. rpass.newTextureDependency(m_runCtx.m_currentMomentsRt, TextureUsageBit::kSampledCompute);
  238. rpass.newTextureDependency(getRenderer().getMotionVectors().getHistoryLengthRt(), TextureUsageBit::kSampledCompute);
  239. rpass.newTextureDependency(m_runCtx.m_historyRt, TextureUsageBit::kImageComputeWrite);
  240. }
  241. // Variance calculation pass
  242. if(m_useSvgf)
  243. {
  244. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows SVGF Variance");
  245. rpass.setWork([this, &ctx](RenderPassWorkContext& rgraphCtx) {
  246. runSvgfVariance(ctx, rgraphCtx);
  247. });
  248. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[0], TextureUsageBit::kSampledCompute);
  249. rpass.newTextureDependency(m_runCtx.m_currentMomentsRt, TextureUsageBit::kSampledCompute);
  250. rpass.newTextureDependency(getRenderer().getMotionVectors().getHistoryLengthRt(), TextureUsageBit::kSampledCompute);
  251. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  252. rpass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSampledCompute);
  253. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[1], TextureUsageBit::kImageComputeWrite);
  254. rpass.newTextureDependency(m_runCtx.m_varianceRts[1], TextureUsageBit::kImageComputeWrite);
  255. }
  256. // SVGF Atrous
  257. if(m_useSvgf)
  258. {
  259. m_runCtx.m_atrousPassIdx = 0;
  260. for(U32 i = 0; i < m_atrousPassCount; ++i)
  261. {
  262. const Bool lastPass = i == U32(m_atrousPassCount - 1);
  263. const U32 readRtIdx = (i + 1) & 1;
  264. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows SVGF Atrous");
  265. rpass.setWork([this, &ctx](RenderPassWorkContext& rgraphCtx) {
  266. runSvgfAtrous(ctx, rgraphCtx);
  267. });
  268. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  269. rpass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSampledCompute);
  270. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[readRtIdx], TextureUsageBit::kSampledCompute);
  271. rpass.newTextureDependency(m_runCtx.m_varianceRts[readRtIdx], TextureUsageBit::kSampledCompute);
  272. if(!lastPass)
  273. {
  274. rpass.newTextureDependency(m_runCtx.m_intermediateShadowsRts[!readRtIdx], TextureUsageBit::kImageComputeWrite);
  275. rpass.newTextureDependency(m_runCtx.m_varianceRts[!readRtIdx], TextureUsageBit::kImageComputeWrite);
  276. }
  277. else
  278. {
  279. rpass.newTextureDependency(m_runCtx.m_historyRt, TextureUsageBit::kImageComputeWrite);
  280. }
  281. }
  282. }
  283. // Upscale
  284. {
  285. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("RtShadows Upscale");
  286. rpass.setWork([this](RenderPassWorkContext& rgraphCtx) {
  287. runUpscale(rgraphCtx);
  288. });
  289. rpass.newTextureDependency(m_runCtx.m_historyRt, TextureUsageBit::kSampledCompute);
  290. rpass.newTextureDependency(getRenderer().getGBuffer().getDepthRt(), TextureUsageBit::kSampledCompute);
  291. rpass.newTextureDependency(ANKI_DEPTH_DEP);
  292. rpass.newTextureDependency(m_runCtx.m_upscaledRt, TextureUsageBit::kImageComputeWrite);
  293. }
  294. // Find out the lights that will take part in RT pass
  295. {
  296. RenderQueue& rqueue = *ctx.m_renderQueue;
  297. m_runCtx.m_layersWithRejectedHistory.unsetAll();
  298. if(rqueue.m_directionalLight.hasShadow())
  299. {
  300. U32 layerIdx;
  301. Bool rejectHistory;
  302. [[maybe_unused]] const Bool layerFound = findShadowLayer(0, layerIdx, rejectHistory);
  303. ANKI_ASSERT(layerFound && "Directional can't fail");
  304. rqueue.m_directionalLight.m_shadowLayer = U8(layerIdx);
  305. ANKI_ASSERT(rqueue.m_directionalLight.m_shadowLayer < kMaxRtShadowLayers);
  306. m_runCtx.m_layersWithRejectedHistory.set(layerIdx, rejectHistory);
  307. }
  308. for(PointLightQueueElement& light : rqueue.m_pointLights)
  309. {
  310. if(!light.hasShadow())
  311. {
  312. continue;
  313. }
  314. U32 layerIdx;
  315. Bool rejectHistory;
  316. const Bool layerFound = findShadowLayer(light.m_uuid, layerIdx, rejectHistory);
  317. if(layerFound)
  318. {
  319. light.m_shadowLayer = U8(layerIdx);
  320. ANKI_ASSERT(light.m_shadowLayer < kMaxRtShadowLayers);
  321. m_runCtx.m_layersWithRejectedHistory.set(layerIdx, rejectHistory);
  322. }
  323. else
  324. {
  325. // Disable shadows
  326. light.m_shadowRenderQueues = {};
  327. }
  328. }
  329. for(SpotLightQueueElement& light : rqueue.m_spotLights)
  330. {
  331. if(!light.hasShadow())
  332. {
  333. continue;
  334. }
  335. U32 layerIdx;
  336. Bool rejectHistory;
  337. const Bool layerFound = findShadowLayer(light.m_uuid, layerIdx, rejectHistory);
  338. if(layerFound)
  339. {
  340. light.m_shadowLayer = U8(layerIdx);
  341. ANKI_ASSERT(light.m_shadowLayer < kMaxRtShadowLayers);
  342. m_runCtx.m_layersWithRejectedHistory.set(layerIdx, rejectHistory);
  343. }
  344. else
  345. {
  346. // Disable shadows
  347. light.m_shadowRenderQueue = nullptr;
  348. }
  349. }
  350. }
  351. }
  352. void RtShadows::run(RenderPassWorkContext& rgraphCtx)
  353. {
  354. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  355. cmdb.bindShaderProgram(m_rtLibraryGrProg.get());
  356. // Allocate, set and bind global uniforms
  357. {
  358. RebarAllocation globalUniformsToken;
  359. MaterialGlobalUniforms* globalUniforms = static_cast<MaterialGlobalUniforms*>(
  360. RebarTransientMemoryPool::getSingleton().allocateFrame(sizeof(MaterialGlobalUniforms), globalUniformsToken));
  361. memset(globalUniforms, 0, sizeof(*globalUniforms)); // Don't care for now
  362. cmdb.bindUniformBuffer(U32(MaterialSet::kGlobal), U32(MaterialBinding::kGlobalUniforms),
  363. &RebarTransientMemoryPool::getSingleton().getBuffer(), globalUniformsToken.m_offset, globalUniformsToken.m_range);
  364. }
  365. // More globals
  366. cmdb.bindAllBindless(U32(MaterialSet::kBindless));
  367. cmdb.bindSampler(U32(MaterialSet::kGlobal), U32(MaterialBinding::kTrilinearRepeatSampler), getRenderer().getSamplers().m_trilinearRepeat.get());
  368. cmdb.bindStorageBuffer(U32(MaterialSet::kGlobal), U32(MaterialBinding::kGpuScene), &GpuSceneBuffer::getSingleton().getBuffer(), 0, kMaxPtrSize);
  369. #define ANKI_UNIFIED_GEOM_FORMAT(fmt, shaderType) \
  370. cmdb.bindReadOnlyTextureBuffer(U32(MaterialSet::kGlobal), U32(MaterialBinding::kUnifiedGeometry_##fmt), \
  371. &UnifiedGeometryBuffer::getSingleton().getBuffer(), 0, kMaxPtrSize, Format::k##fmt);
  372. #include <AnKi/Shaders/Include/UnifiedGeometryTypes.defs.h>
  373. constexpr U32 kSet = 2;
  374. bindUniforms(cmdb, kSet, 0, getRenderer().getClusterBinning().getClusteredUniformsRebarToken());
  375. getRenderer().getPackVisibleClusteredObjects().bindClusteredObjectBuffer(cmdb, kSet, 1, ClusteredObjectType::kPointLight);
  376. getRenderer().getPackVisibleClusteredObjects().bindClusteredObjectBuffer(cmdb, kSet, 2, ClusteredObjectType::kSpotLight);
  377. rgraphCtx.bindColorTexture(kSet, 3, getRenderer().getShadowMapping().getShadowmapRt());
  378. bindStorage(cmdb, kSet, 4, getRenderer().getClusterBinning().getClustersRebarToken());
  379. cmdb.bindSampler(kSet, 5, getRenderer().getSamplers().m_trilinearRepeat.get());
  380. rgraphCtx.bindImage(kSet, 6, m_runCtx.m_intermediateShadowsRts[0]);
  381. rgraphCtx.bindColorTexture(kSet, 7, m_runCtx.m_historyRt);
  382. cmdb.bindSampler(kSet, 8, getRenderer().getSamplers().m_trilinearClamp.get());
  383. cmdb.bindSampler(kSet, 9, getRenderer().getSamplers().m_nearestNearestClamp.get());
  384. rgraphCtx.bindTexture(kSet, 10, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
  385. rgraphCtx.bindColorTexture(kSet, 11, getRenderer().getMotionVectors().getMotionVectorsRt());
  386. rgraphCtx.bindColorTexture(kSet, 12, getRenderer().getMotionVectors().getHistoryLengthRt());
  387. rgraphCtx.bindColorTexture(kSet, 13, getRenderer().getGBuffer().getColorRt(2));
  388. rgraphCtx.bindAccelerationStructure(kSet, 14, getRenderer().getAccelerationStructureBuilder().getAccelerationStructureHandle());
  389. rgraphCtx.bindColorTexture(kSet, 15, m_runCtx.m_prevMomentsRt);
  390. rgraphCtx.bindImage(kSet, 16, m_runCtx.m_currentMomentsRt);
  391. cmdb.bindTexture(kSet, 17, &m_blueNoiseImage->getTextureView());
  392. RtShadowsUniforms unis;
  393. for(U32 i = 0; i < kMaxRtShadowLayers; ++i)
  394. {
  395. unis.historyRejectFactor[i] = F32(m_runCtx.m_layersWithRejectedHistory.get(i));
  396. }
  397. cmdb.setPushConstants(&unis, sizeof(unis));
  398. cmdb.traceRays(m_runCtx.m_sbtBuffer.get(), m_runCtx.m_sbtOffset, m_sbtRecordSize, m_runCtx.m_hitGroupCount, 1,
  399. getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2, 1);
  400. }
  401. void RtShadows::runDenoise(const RenderingContext& ctx, RenderPassWorkContext& rgraphCtx)
  402. {
  403. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  404. cmdb.bindShaderProgram((m_runCtx.m_denoiseOrientation == 0) ? m_grDenoiseHorizontalProg.get() : m_grDenoiseVerticalProg.get());
  405. cmdb.bindSampler(0, 0, getRenderer().getSamplers().m_nearestNearestClamp.get());
  406. cmdb.bindSampler(0, 1, getRenderer().getSamplers().m_trilinearClamp.get());
  407. rgraphCtx.bindColorTexture(0, 2, m_runCtx.m_intermediateShadowsRts[m_runCtx.m_denoiseOrientation]);
  408. rgraphCtx.bindTexture(0, 3, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
  409. rgraphCtx.bindColorTexture(0, 4, getRenderer().getGBuffer().getColorRt(2));
  410. rgraphCtx.bindColorTexture(0, 5, m_runCtx.m_currentMomentsRt);
  411. rgraphCtx.bindColorTexture(0, 6, getRenderer().getMotionVectors().getHistoryLengthRt());
  412. rgraphCtx.bindImage(0, 7, (m_runCtx.m_denoiseOrientation == 0) ? m_runCtx.m_intermediateShadowsRts[1] : m_runCtx.m_historyRt);
  413. RtShadowsDenoiseUniforms unis;
  414. unis.invViewProjMat = ctx.m_matrices.m_invertedViewProjectionJitter;
  415. unis.time = F32(GlobalFrameIndex::getSingleton().m_value);
  416. cmdb.setPushConstants(&unis, sizeof(unis));
  417. dispatchPPCompute(cmdb, 8, 8, getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2);
  418. m_runCtx.m_denoiseOrientation = !m_runCtx.m_denoiseOrientation;
  419. }
  420. void RtShadows::runSvgfVariance(const RenderingContext& ctx, RenderPassWorkContext& rgraphCtx)
  421. {
  422. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  423. cmdb.bindShaderProgram(m_svgfVarianceGrProg.get());
  424. cmdb.bindSampler(0, 0, getRenderer().getSamplers().m_nearestNearestClamp.get());
  425. cmdb.bindSampler(0, 1, getRenderer().getSamplers().m_trilinearClamp.get());
  426. rgraphCtx.bindColorTexture(0, 2, m_runCtx.m_intermediateShadowsRts[0]);
  427. rgraphCtx.bindColorTexture(0, 3, m_runCtx.m_currentMomentsRt);
  428. rgraphCtx.bindColorTexture(0, 4, getRenderer().getMotionVectors().getHistoryLengthRt());
  429. rgraphCtx.bindTexture(0, 5, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
  430. rgraphCtx.bindImage(0, 6, m_runCtx.m_intermediateShadowsRts[1]);
  431. rgraphCtx.bindImage(0, 7, m_runCtx.m_varianceRts[1]);
  432. const Mat4& invProjMat = ctx.m_matrices.m_projectionJitter.getInverse();
  433. cmdb.setPushConstants(&invProjMat, sizeof(invProjMat));
  434. dispatchPPCompute(cmdb, 8, 8, getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2);
  435. }
  436. void RtShadows::runSvgfAtrous(const RenderingContext& ctx, RenderPassWorkContext& rgraphCtx)
  437. {
  438. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  439. const Bool lastPass = m_runCtx.m_atrousPassIdx == m_atrousPassCount - 1;
  440. const U32 readRtIdx = (m_runCtx.m_atrousPassIdx + 1) & 1;
  441. if(lastPass)
  442. {
  443. cmdb.bindShaderProgram(m_svgfAtrousLastPassGrProg.get());
  444. }
  445. else
  446. {
  447. cmdb.bindShaderProgram(m_svgfAtrousGrProg.get());
  448. }
  449. cmdb.bindSampler(0, 0, getRenderer().getSamplers().m_nearestNearestClamp.get());
  450. cmdb.bindSampler(0, 1, getRenderer().getSamplers().m_trilinearClamp.get());
  451. rgraphCtx.bindTexture(0, 2, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
  452. rgraphCtx.bindColorTexture(0, 3, m_runCtx.m_intermediateShadowsRts[readRtIdx]);
  453. rgraphCtx.bindColorTexture(0, 4, m_runCtx.m_varianceRts[readRtIdx]);
  454. if(!lastPass)
  455. {
  456. rgraphCtx.bindImage(0, 5, m_runCtx.m_intermediateShadowsRts[!readRtIdx]);
  457. rgraphCtx.bindImage(0, 6, m_runCtx.m_varianceRts[!readRtIdx]);
  458. }
  459. else
  460. {
  461. rgraphCtx.bindImage(0, 5, m_runCtx.m_historyRt);
  462. }
  463. const Mat4& invProjMat = ctx.m_matrices.m_projectionJitter.getInverse();
  464. cmdb.setPushConstants(&invProjMat, sizeof(invProjMat));
  465. dispatchPPCompute(cmdb, 8, 8, getRenderer().getInternalResolution().x() / 2, getRenderer().getInternalResolution().y() / 2);
  466. ++m_runCtx.m_atrousPassIdx;
  467. }
  468. void RtShadows::runUpscale(RenderPassWorkContext& rgraphCtx)
  469. {
  470. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  471. cmdb.bindShaderProgram(m_upscaleGrProg.get());
  472. cmdb.bindSampler(0, 0, getRenderer().getSamplers().m_nearestNearestClamp.get());
  473. cmdb.bindSampler(0, 1, getRenderer().getSamplers().m_trilinearClamp.get());
  474. rgraphCtx.bindColorTexture(0, 2, m_runCtx.m_historyRt);
  475. rgraphCtx.bindImage(0, 3, m_runCtx.m_upscaledRt);
  476. rgraphCtx.bindTexture(0, 4, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
  477. rgraphCtx.bindTexture(0, 5, getRenderer().getGBuffer().getDepthRt(), TextureSubresourceInfo(DepthStencilAspectBit::kDepth));
  478. dispatchPPCompute(cmdb, 8, 8, getRenderer().getInternalResolution().x(), getRenderer().getInternalResolution().y());
  479. }
  480. void RtShadows::buildSbt(RenderingContext& ctx)
  481. {
  482. // Get some things
  483. ANKI_ASSERT(ctx.m_renderQueue->m_rayTracingQueue);
  484. ConstWeakArray<RayTracingInstanceQueueElement> instanceElements = ctx.m_renderQueue->m_rayTracingQueue->m_rayTracingInstances;
  485. const U32 instanceCount = instanceElements.getSize();
  486. ANKI_ASSERT(instanceCount > 0);
  487. const U32 shaderHandleSize = GrManager::getSingleton().getDeviceCapabilities().m_shaderGroupHandleSize;
  488. const U32 extraSbtRecords = 1 + 1; // Raygen + miss
  489. m_runCtx.m_hitGroupCount = instanceCount;
  490. // Allocate SBT
  491. RebarAllocation token;
  492. U8* sbt = allocateStorage<U8*>(PtrSize(m_sbtRecordSize) * (instanceCount + extraSbtRecords), token);
  493. [[maybe_unused]] const U8* sbtStart = sbt;
  494. m_runCtx.m_sbtBuffer.reset(const_cast<Buffer*>(&RebarTransientMemoryPool::getSingleton().getBuffer()));
  495. m_runCtx.m_sbtOffset = token.m_offset;
  496. // Set the miss and ray gen handles
  497. ConstWeakArray<U8> shaderGroupHandles = m_rtLibraryGrProg->getShaderGroupHandles();
  498. memcpy(sbt, &shaderGroupHandles[m_rayGenShaderGroupIdx * shaderHandleSize], shaderHandleSize);
  499. sbt += m_sbtRecordSize;
  500. memcpy(sbt, &shaderGroupHandles[m_missShaderGroupIdx * shaderHandleSize], shaderHandleSize);
  501. sbt += m_sbtRecordSize;
  502. // Init SBT and instances
  503. ANKI_ASSERT(m_sbtRecordSize >= shaderHandleSize + sizeof(ModelGpuDescriptor));
  504. for(U32 instanceIdx = 0; instanceIdx < instanceCount; ++instanceIdx)
  505. {
  506. const RayTracingInstanceQueueElement& element = instanceElements[instanceIdx];
  507. // Init SBT record
  508. memcpy(sbt, &shaderGroupHandles[element.m_shaderGroupHandleIndex * shaderHandleSize], shaderHandleSize);
  509. ANKI_ASSERT(shaderHandleSize + sizeof(GpuSceneRenderable) <= m_sbtRecordSize);
  510. GpuSceneRenderable* shaderRecord = reinterpret_cast<GpuSceneRenderable*>(sbt + shaderHandleSize);
  511. shaderRecord->m_worldTransformsOffset = element.m_worldTransformsOffset;
  512. shaderRecord->m_uniformsOffset = element.m_uniformsOffset;
  513. shaderRecord->m_geometryOffset = element.m_geometryOffset;
  514. shaderRecord->m_boneTransformsOffset = 0;
  515. sbt += m_sbtRecordSize;
  516. }
  517. ANKI_ASSERT(sbtStart + m_sbtRecordSize * (instanceCount + extraSbtRecords) == sbt);
  518. }
  519. Bool RtShadows::findShadowLayer(U64 lightUuid, U32& layerIdx, Bool& rejectHistoryBuffer)
  520. {
  521. const U64 crntFrame = getRenderer().getFrameCount();
  522. layerIdx = kMaxU32;
  523. U32 nextBestLayerIdx = kMaxU32;
  524. U64 nextBestLayerFame = crntFrame;
  525. rejectHistoryBuffer = false;
  526. for(U32 i = 0; i < m_shadowLayers.getSize(); ++i)
  527. {
  528. ShadowLayer& layer = m_shadowLayers[i];
  529. if(layer.m_lightUuid == lightUuid && layer.m_frameLastUsed == crntFrame - 1)
  530. {
  531. // Found it being used last frame
  532. layerIdx = i;
  533. layer.m_frameLastUsed = crntFrame;
  534. layer.m_lightUuid = lightUuid;
  535. break;
  536. }
  537. else if(layer.m_lightUuid == lightUuid || layer.m_frameLastUsed == kMaxU64)
  538. {
  539. // Found an empty slot or slot used by the same light
  540. layerIdx = i;
  541. layer.m_frameLastUsed = crntFrame;
  542. layer.m_lightUuid = lightUuid;
  543. rejectHistoryBuffer = true;
  544. break;
  545. }
  546. else if(layer.m_frameLastUsed < nextBestLayerFame)
  547. {
  548. nextBestLayerIdx = i;
  549. nextBestLayerFame = crntFrame;
  550. }
  551. }
  552. // Not found but there is a good candidate. Use that
  553. if(layerIdx == kMaxU32 && nextBestLayerIdx != kMaxU32)
  554. {
  555. layerIdx = nextBestLayerIdx;
  556. m_shadowLayers[nextBestLayerIdx].m_frameLastUsed = crntFrame;
  557. m_shadowLayers[nextBestLayerIdx].m_lightUuid = lightUuid;
  558. rejectHistoryBuffer = true;
  559. }
  560. return layerIdx != kMaxU32;
  561. }
  562. void RtShadows::getDebugRenderTarget(CString rtName, Array<RenderTargetHandle, kMaxDebugRenderTargets>& handles,
  563. ShaderProgramPtr& optionalShaderProgram) const
  564. {
  565. U32 layerGroup = 0;
  566. if(rtName == "RtShadows")
  567. {
  568. layerGroup = 0;
  569. }
  570. else if(rtName == "RtShadows1")
  571. {
  572. layerGroup = 1;
  573. }
  574. else
  575. {
  576. ANKI_ASSERT(rtName == "RtShadows2");
  577. layerGroup = 2;
  578. }
  579. handles[0] = m_runCtx.m_upscaledRt;
  580. ShaderProgramResourceVariantInitInfo variantInit(m_visualizeRenderTargetsProg);
  581. variantInit.addMutation("LAYER_GROUP", layerGroup);
  582. const ShaderProgramResourceVariant* variant;
  583. m_visualizeRenderTargetsProg->getOrCreateVariant(variantInit, variant);
  584. optionalShaderProgram.reset(&variant->getProgram());
  585. }
  586. } // end namespace anki