IndirectDiffuseClipmaps.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288
  1. // Copyright (C) 2009-present, Panagiotis Christopoulos Charitos and contributors.
  2. // All rights reserved.
  3. // Code licensed under the BSD License.
  4. // http://www.anki3d.org/LICENSE
  5. #include <AnKi/Renderer/IndirectDiffuseClipmaps.h>
  6. #include <AnKi/Renderer/Renderer.h>
  7. #include <AnKi/Renderer/GBuffer.h>
  8. #include <AnKi/Renderer/AccelerationStructureBuilder.h>
  9. #include <AnKi/Renderer/Sky.h>
  10. #include <AnKi/Renderer/ShadowMapping.h>
  11. #include <AnKi/Scene/Components/SkyboxComponent.h>
  12. #include <AnKi/Shaders/Include/MaterialTypes.h>
  13. #include <AnKi/Util/Tracer.h>
  14. #include <AnKi/GpuMemory/UnifiedGeometryBuffer.h>
  15. namespace anki {
  16. Error IndirectDiffuseClipmaps::init()
  17. {
  18. m_tmpRtDesc = getRenderer().create2DRenderTargetDescription(getRenderer().getInternalResolution().x(), getRenderer().getInternalResolution().y(),
  19. Format::kR8G8B8A8_Unorm, "Test");
  20. m_tmpRtDesc.bake();
  21. m_clipmapInfo[0].m_probeCounts = Vec3(F32(g_indirectDiffuseClipmap0ProbesPerDimCVar));
  22. m_clipmapInfo[1].m_probeCounts = Vec3(F32(g_indirectDiffuseClipmap1ProbesPerDimCVar));
  23. m_clipmapInfo[2].m_probeCounts = Vec3(F32(g_indirectDiffuseClipmap2ProbesPerDimCVar));
  24. m_clipmapInfo[0].m_size = Vec3(g_indirectDiffuseClipmap0SizeCVar);
  25. m_clipmapInfo[1].m_size = Vec3(g_indirectDiffuseClipmap1SizeCVar);
  26. m_clipmapInfo[2].m_size = Vec3(g_indirectDiffuseClipmap2SizeCVar);
  27. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  28. {
  29. for(U32 dir = 0; dir < 6; ++dir)
  30. {
  31. TextureInitInfo volumeInit = getRenderer().create2DRenderTargetInitInfo(
  32. U32(m_clipmapInfo[clipmap].m_probeCounts.x()), U32(m_clipmapInfo[clipmap].m_probeCounts.y()), Format::kB10G11R11_Ufloat_Pack32,
  33. TextureUsageBit::kAllShaderResource, generateTempPassName("IndirectDiffuseClipmap #%u dir #%u", clipmap, dir));
  34. volumeInit.m_depth = U32(m_clipmapInfo[clipmap].m_probeCounts.z());
  35. volumeInit.m_type = TextureType::k3D;
  36. m_clipmapVolumes[clipmap].m_directions[dir] = getRenderer().createAndClearRenderTarget(volumeInit, TextureUsageBit::kSrvCompute);
  37. }
  38. }
  39. ANKI_CHECK(loadShaderProgram("ShaderBinaries/IndirectDiffuseClipmaps.ankiprogbin", {}, m_prog, m_tmpVisGrProg, "Test"));
  40. ANKI_CHECK(loadShaderProgram("ShaderBinaries/RtSbtBuild.ankiprogbin", {{"TECHNIQUE", 1}}, m_sbtProg, m_sbtBuildGrProg, "SbtBuild"));
  41. {
  42. ShaderProgramResourcePtr tmpProg;
  43. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/IndirectDiffuseClipmaps.ankiprogbin", tmpProg));
  44. ANKI_ASSERT(tmpProg == m_prog);
  45. ShaderProgramResourceVariantInitInfo variantInitInfo(m_prog);
  46. variantInitInfo.requestTechniqueAndTypes(ShaderTypeBit::kRayGen, "RtMaterialFetch");
  47. const ShaderProgramResourceVariant* variant;
  48. m_prog->getOrCreateVariant(variantInitInfo, variant);
  49. m_libraryGrProg.reset(&variant->getProgram());
  50. m_rayGenShaderGroupIdx = variant->getShaderGroupHandleIndex();
  51. }
  52. {
  53. ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/RtMaterialFetchMiss.ankiprogbin", m_missProg));
  54. ShaderProgramResourceVariantInitInfo variantInitInfo(m_missProg);
  55. variantInitInfo.requestTechniqueAndTypes(ShaderTypeBit::kMiss, "RtMaterialFetch");
  56. const ShaderProgramResourceVariant* variant;
  57. m_missProg->getOrCreateVariant(variantInitInfo, variant);
  58. m_missShaderGroupIdx = variant->getShaderGroupHandleIndex();
  59. }
  60. m_sbtRecordSize = getAlignedRoundUp(GrManager::getSingleton().getDeviceCapabilities().m_sbtRecordAlignment,
  61. GrManager::getSingleton().getDeviceCapabilities().m_shaderGroupHandleSize + U32(sizeof(UVec4)));
  62. return Error::kNone;
  63. }
  64. void IndirectDiffuseClipmaps::populateRenderGraph(RenderingContext& ctx)
  65. {
  66. ANKI_TRACE_SCOPED_EVENT(IndirectDiffuse);
  67. RenderGraphBuilder& rgraph = ctx.m_renderGraphDescr;
  68. Array2d<RenderTargetHandle, kIndirectDiffuseClipmapCount, 6> volumeRts;
  69. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  70. {
  71. for(U32 dir = 0; dir < 6; ++dir)
  72. {
  73. if(!m_clipmapsImportedOnce)
  74. {
  75. volumeRts[clipmap][dir] = rgraph.importRenderTarget(m_clipmapVolumes[clipmap].m_directions[dir].get(), TextureUsageBit::kSrvCompute);
  76. }
  77. else
  78. {
  79. volumeRts[clipmap][dir] = rgraph.importRenderTarget(m_clipmapVolumes[clipmap].m_directions[dir].get());
  80. }
  81. }
  82. }
  83. m_clipmapsImportedOnce = true;
  84. m_runCtx.m_tmpRt = rgraph.newRenderTarget(m_tmpRtDesc);
  85. // SBT build
  86. BufferHandle sbtHandle;
  87. BufferView sbtBuffer;
  88. {
  89. BufferHandle visibilityDep;
  90. BufferView visibleRenderableIndicesBuff, buildSbtIndirectArgsBuff;
  91. getRenderer().getAccelerationStructureBuilder().getVisibilityInfo(visibilityDep, visibleRenderableIndicesBuff, buildSbtIndirectArgsBuff);
  92. // Allocate SBT
  93. U32 sbtAlignment = (GrManager::getSingleton().getDeviceCapabilities().m_structuredBufferNaturalAlignment)
  94. ? sizeof(U32)
  95. : GrManager::getSingleton().getDeviceCapabilities().m_structuredBufferBindOffsetAlignment;
  96. sbtAlignment = computeCompoundAlignment(sbtAlignment, GrManager::getSingleton().getDeviceCapabilities().m_sbtRecordAlignment);
  97. U8* sbtMem;
  98. sbtBuffer = RebarTransientMemoryPool::getSingleton().allocate(
  99. (GpuSceneArrays::RenderableBoundingVolumeRt::getSingleton().getElementCount() + 2) * m_sbtRecordSize, sbtAlignment, sbtMem);
  100. sbtHandle = rgraph.importBuffer(sbtBuffer, BufferUsageBit::kNone);
  101. // Write the first 2 entries of the SBT
  102. ConstWeakArray<U8> shaderGroupHandles = m_libraryGrProg->getShaderGroupHandles();
  103. const U32 shaderHandleSize = GrManager::getSingleton().getDeviceCapabilities().m_shaderGroupHandleSize;
  104. memcpy(sbtMem, &shaderGroupHandles[m_rayGenShaderGroupIdx * shaderHandleSize], shaderHandleSize);
  105. memcpy(sbtMem + m_sbtRecordSize, &shaderGroupHandles[m_missShaderGroupIdx * shaderHandleSize], shaderHandleSize);
  106. // Create the pass
  107. NonGraphicsRenderPass& rpass = rgraph.newNonGraphicsRenderPass("RtReflections build SBT");
  108. rpass.newBufferDependency(visibilityDep, BufferUsageBit::kIndirectCompute | BufferUsageBit::kSrvCompute);
  109. rpass.newBufferDependency(sbtHandle, BufferUsageBit::kUavCompute);
  110. rpass.setWork([this, buildSbtIndirectArgsBuff, sbtBuffer, visibleRenderableIndicesBuff](RenderPassWorkContext& rgraphCtx) {
  111. ANKI_TRACE_SCOPED_EVENT(ReflectionsSbtBuild);
  112. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  113. cmdb.bindShaderProgram(m_sbtBuildGrProg.get());
  114. cmdb.bindSrv(0, 0, GpuSceneArrays::Renderable::getSingleton().getBufferView());
  115. cmdb.bindSrv(1, 0, visibleRenderableIndicesBuff);
  116. cmdb.bindSrv(2, 0, BufferView(&m_libraryGrProg->getShaderGroupHandlesGpuBuffer()));
  117. cmdb.bindUav(0, 0, sbtBuffer);
  118. RtShadowsSbtBuildConstants consts = {};
  119. ANKI_ASSERT(m_sbtRecordSize % 4 == 0);
  120. consts.m_sbtRecordDwordSize = m_sbtRecordSize / 4;
  121. const U32 shaderHandleSize = GrManager::getSingleton().getDeviceCapabilities().m_shaderGroupHandleSize;
  122. ANKI_ASSERT(shaderHandleSize % 4 == 0);
  123. consts.m_shaderHandleDwordSize = shaderHandleSize / 4;
  124. cmdb.setFastConstants(&consts, sizeof(consts));
  125. cmdb.dispatchComputeIndirect(buildSbtIndirectArgsBuff);
  126. });
  127. }
  128. // Do ray tracing around the probes
  129. {
  130. NonGraphicsRenderPass& pass = rgraph.newNonGraphicsRenderPass("IndirectDiffuseClipmaps");
  131. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  132. {
  133. for(U32 dir = 0; dir < 6; ++dir)
  134. {
  135. pass.newTextureDependency(volumeRts[clipmap][dir], TextureUsageBit::kUavCompute);
  136. }
  137. }
  138. pass.newBufferDependency(sbtHandle, BufferUsageBit::kShaderBindingTable);
  139. if(getRenderer().getGeneratedSky().isEnabled())
  140. {
  141. pass.newTextureDependency(getRenderer().getGeneratedSky().getEnvironmentMapRt(), TextureUsageBit::kSrvTraceRays);
  142. }
  143. pass.newTextureDependency(getRenderer().getShadowMapping().getShadowmapRt(), TextureUsageBit::kSrvTraceRays);
  144. pass.newAccelerationStructureDependency(getRenderer().getAccelerationStructureBuilder().getAccelerationStructureHandle(),
  145. AccelerationStructureUsageBit::kTraceRaysSrv);
  146. pass.setWork([this, volumeRts, &ctx, sbtBuffer](RenderPassWorkContext& rgraphCtx) {
  147. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  148. cmdb.bindShaderProgram(m_libraryGrProg.get());
  149. // More globals
  150. cmdb.bindSampler(ANKI_MATERIAL_REGISTER_TILINEAR_REPEAT_SAMPLER, 0, getRenderer().getSamplers().m_trilinearRepeat.get());
  151. cmdb.bindSrv(ANKI_MATERIAL_REGISTER_GPU_SCENE, 0, GpuSceneBuffer::getSingleton().getBufferView());
  152. cmdb.bindSrv(ANKI_MATERIAL_REGISTER_MESH_LODS, 0, GpuSceneArrays::MeshLod::getSingleton().getBufferView());
  153. cmdb.bindSrv(ANKI_MATERIAL_REGISTER_TRANSFORMS, 0, GpuSceneArrays::Transform::getSingleton().getBufferView());
  154. #define ANKI_UNIFIED_GEOM_FORMAT(fmt, shaderType, reg) \
  155. cmdb.bindSrv( \
  156. reg, 0, \
  157. BufferView(&UnifiedGeometryBuffer::getSingleton().getBuffer(), 0, \
  158. getAlignedRoundDown(getFormatInfo(Format::k##fmt).m_texelSize, UnifiedGeometryBuffer::getSingleton().getBuffer().getSize())), \
  159. Format::k##fmt);
  160. #include <AnKi/Shaders/Include/UnifiedGeometryTypes.def.h>
  161. cmdb.bindConstantBuffer(0, 2, ctx.m_globalRenderingConstantsBuffer);
  162. rgraphCtx.bindSrv(0, 2, getRenderer().getAccelerationStructureBuilder().getAccelerationStructureHandle());
  163. cmdb.bindSrv(1, 2, TextureView(getDummyGpuResources().m_texture2DSrv.get(), TextureSubresourceDesc::all()));
  164. cmdb.bindSrv(2, 2, TextureView(getDummyGpuResources().m_texture2DSrv.get(), TextureSubresourceDesc::all()));
  165. cmdb.bindSrv(3, 2, TextureView(getDummyGpuResources().m_texture2DSrv.get(), TextureSubresourceDesc::all()));
  166. const LightComponent* dirLight = SceneGraph::getSingleton().getDirectionalLight();
  167. const SkyboxComponent* sky = SceneGraph::getSingleton().getSkybox();
  168. const Bool bSkySolidColor =
  169. (!sky || sky->getSkyboxType() == SkyboxType::kSolidColor || (!dirLight && sky->getSkyboxType() == SkyboxType::kGenerated));
  170. if(bSkySolidColor)
  171. {
  172. cmdb.bindSrv(4, 2, TextureView(getDummyGpuResources().m_texture2DSrv.get(), TextureSubresourceDesc::all()));
  173. }
  174. else if(sky->getSkyboxType() == SkyboxType::kImage2D)
  175. {
  176. cmdb.bindSrv(4, 2, TextureView(&sky->getImageResource().getTexture(), TextureSubresourceDesc::all()));
  177. }
  178. else
  179. {
  180. rgraphCtx.bindSrv(4, 2, getRenderer().getGeneratedSky().getEnvironmentMapRt());
  181. }
  182. cmdb.bindSrv(5, 2, BufferView(getDummyGpuResources().m_buffer.get(), 0, sizeof(U32)));
  183. cmdb.bindSrv(6, 2, BufferView(getDummyGpuResources().m_buffer.get(), 0, sizeof(U32)));
  184. rgraphCtx.bindSrv(7, 2, getRenderer().getShadowMapping().getShadowmapRt());
  185. cmdb.bindSampler(0, 2, getRenderer().getSamplers().m_trilinearClamp.get());
  186. cmdb.bindSampler(1, 2, getRenderer().getSamplers().m_trilinearClampShadow.get());
  187. cmdb.bindUav(7, 2, TextureView(getDummyGpuResources().m_texture2DUav.get(), TextureSubresourceDesc::firstSurface()));
  188. cmdb.bindUav(8, 2, TextureView(getDummyGpuResources().m_texture2DUav.get(), TextureSubresourceDesc::firstSurface()));
  189. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  190. {
  191. for(U32 dir = 0; dir < 6; ++dir)
  192. {
  193. rgraphCtx.bindUav(dir, 2, volumeRts[clipmap][dir]);
  194. }
  195. const UVec4 consts(clipmap);
  196. cmdb.setFastConstants(&consts, sizeof(consts));
  197. const U32 probeCount = m_clipmapVolumes[clipmap].m_directions[0]->getWidth();
  198. cmdb.traceRays(sbtBuffer, m_sbtRecordSize, GpuSceneArrays::RenderableBoundingVolumeRt::getSingleton().getElementCount(), 1,
  199. probeCount, probeCount, probeCount);
  200. }
  201. });
  202. }
  203. {
  204. NonGraphicsRenderPass& pass = rgraph.newNonGraphicsRenderPass("IndirectDiffuseClipmaps test");
  205. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  206. {
  207. for(U32 dir = 0; dir < 6; ++dir)
  208. {
  209. pass.newTextureDependency(volumeRts[clipmap][dir], TextureUsageBit::kSrvCompute);
  210. }
  211. }
  212. pass.newTextureDependency(getRenderer().getGBuffer().getDepthRt(), TextureUsageBit::kSrvCompute);
  213. pass.newTextureDependency(getRenderer().getGBuffer().getColorRt(2), TextureUsageBit::kSrvCompute);
  214. pass.newTextureDependency(m_runCtx.m_tmpRt, TextureUsageBit::kUavCompute);
  215. pass.setWork([this, volumeRts, &ctx](RenderPassWorkContext& rgraphCtx) {
  216. CommandBuffer& cmdb = *rgraphCtx.m_commandBuffer;
  217. cmdb.bindShaderProgram(m_tmpVisGrProg.get());
  218. rgraphCtx.bindSrv(0, 0, getRenderer().getGBuffer().getDepthRt());
  219. rgraphCtx.bindSrv(1, 0, getRenderer().getGBuffer().getColorRt(2));
  220. for(U32 clipmap = 0; clipmap < kIndirectDiffuseClipmapCount; ++clipmap)
  221. {
  222. for(U32 dir = 0; dir < 6; ++dir)
  223. {
  224. rgraphCtx.bindSrv(clipmap * 6 + dir + 2, 0, volumeRts[clipmap][dir]);
  225. }
  226. }
  227. rgraphCtx.bindUav(0, 0, m_runCtx.m_tmpRt);
  228. cmdb.bindConstantBuffer(0, 0, ctx.m_globalRenderingConstantsBuffer);
  229. cmdb.bindSampler(0, 0, getRenderer().getSamplers().m_trilinearRepeat.get());
  230. dispatchPPCompute(cmdb, 8, 8, getRenderer().getInternalResolution().x(), getRenderer().getInternalResolution().y());
  231. });
  232. }
  233. }
  234. } // end namespace anki