Ssgi.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286
  1. // Copyright (C) 2009-2021, Panagiotis Christopoulos Charitos and contributors.
  2. // All rights reserved.
  3. // Code licensed under the BSD License.
  4. // http://www.anki3d.org/LICENSE
  5. #include <AnKi/Renderer/Ssgi.h>
  6. #include <AnKi/Renderer/Renderer.h>
  7. #include <AnKi/Renderer/DepthDownscale.h>
  8. #include <AnKi/Renderer/GBuffer.h>
  9. #include <AnKi/Renderer/DownscaleBlur.h>
  10. #include <AnKi/Renderer/MotionVectors.h>
  11. #include <AnKi/Core/ConfigSet.h>
  12. #include <AnKi/Shaders/Include/SsgiTypes.h>
  13. namespace anki
  14. {
  15. static constexpr U32 WRITE = 0;
  16. static constexpr U32 READ = 1;
  17. Ssgi::~Ssgi()
  18. {
  19. }
  20. Error Ssgi::init(const ConfigSet& cfg)
  21. {
  22. const Error err = initInternal(cfg);
  23. if(err)
  24. {
  25. ANKI_R_LOGE("Failed to initialize SSGI pass");
  26. }
  27. return err;
  28. }
  29. Error Ssgi::initInternal(const ConfigSet& cfg)
  30. {
  31. const U32 width = m_r->getWidth();
  32. const U32 height = m_r->getHeight();
  33. ANKI_ASSERT((width % 2) == 0 && (height % 2) == 0 && "The algorithms won't work");
  34. ANKI_R_LOGI("Initializing SSGI pass");
  35. m_main.m_maxSteps = cfg.getNumberU32("r_ssgiMaxSteps");
  36. m_main.m_depthLod = min(cfg.getNumberU32("r_ssgiDepthLod"), m_r->getDepthDownscale().getMipmapCount() - 1);
  37. m_main.m_firstStepPixels = 32;
  38. ANKI_CHECK(getResourceManager().loadResource("EngineAssets/BlueNoiseRgb816x16.png", m_main.m_noiseTex));
  39. // Init main
  40. {
  41. m_main.m_rtDescr =
  42. m_r->create2DRenderTargetDescription(width / 2, height / 2, Format::B10G11R11_UFLOAT_PACK32, "SSGI_tmp");
  43. m_main.m_rtDescr.bake();
  44. ANKI_CHECK(getResourceManager().loadResource("Shaders/Ssgi.ankiprog", m_main.m_prog));
  45. ShaderProgramResourceVariantInitInfo variantInitInfo(m_main.m_prog);
  46. for(U32 i = 0; i < 4; ++i)
  47. {
  48. variantInitInfo.addMutation("VARIANT", i);
  49. const ShaderProgramResourceVariant* variant;
  50. m_main.m_prog->getOrCreateVariant(variantInitInfo, variant);
  51. m_main.m_grProg[i] = variant->getProgram();
  52. }
  53. }
  54. // Init denoise
  55. {
  56. ANKI_CHECK(getResourceManager().loadResource("Shaders/SsgiDenoise.ankiprog", m_denoise.m_prog));
  57. ShaderProgramResourceVariantInitInfo variantInitInfo(m_denoise.m_prog);
  58. const ShaderProgramResourceVariant* variant;
  59. variantInitInfo.addConstant("IN_TEXTURE_SIZE", UVec2(width / 2, height / 2));
  60. for(U32 i = 0; i < 4; ++i)
  61. {
  62. variantInitInfo.addMutation("VARIANT", i);
  63. variantInitInfo.addMutation("SAMPLE_COUNT", 11);
  64. variantInitInfo.addMutation("ORIENTATION", 0);
  65. m_denoise.m_prog->getOrCreateVariant(variantInitInfo, variant);
  66. m_denoise.m_grProg[0][i] = variant->getProgram();
  67. variantInitInfo.addMutation("SAMPLE_COUNT", 15);
  68. variantInitInfo.addMutation("ORIENTATION", 1);
  69. m_denoise.m_prog->getOrCreateVariant(variantInitInfo, variant);
  70. m_denoise.m_grProg[1][i] = variant->getProgram();
  71. }
  72. }
  73. // Init reconstruction
  74. {
  75. ANKI_CHECK(getResourceManager().loadResource("Shaders/SsgiReconstruct.ankiprog", m_recontruction.m_prog));
  76. ShaderProgramResourceVariantInitInfo variantInitInfo(m_recontruction.m_prog);
  77. variantInitInfo.addConstant("FB_SIZE", UVec2(m_r->getWidth(), m_r->getHeight()));
  78. const ShaderProgramResourceVariant* variant;
  79. for(U32 i = 0; i < 4; ++i)
  80. {
  81. variantInitInfo.addMutation("VARIANT", i);
  82. m_recontruction.m_prog->getOrCreateVariant(variantInitInfo, variant);
  83. m_recontruction.m_grProg[i] = variant->getProgram();
  84. }
  85. TextureInitInfo initInfo = m_r->create2DRenderTargetInitInfo(
  86. width, height, Format::B10G11R11_UFLOAT_PACK32,
  87. TextureUsageBit::ALL_SAMPLED | TextureUsageBit::IMAGE_COMPUTE_WRITE, "SSGI");
  88. initInfo.m_initialUsage = TextureUsageBit::SAMPLED_FRAGMENT;
  89. m_recontruction.m_rt = m_r->createAndClearRenderTarget(initInfo);
  90. }
  91. return Error::NONE;
  92. }
  93. void Ssgi::populateRenderGraph(RenderingContext& ctx)
  94. {
  95. RenderGraphDescription& rgraph = ctx.m_renderGraphDescr;
  96. m_runCtx.m_ctx = &ctx;
  97. // Main pass
  98. {
  99. // Create RTs
  100. if(ANKI_LIKELY(m_recontruction.m_rtImportedOnce))
  101. {
  102. m_runCtx.m_finalRt = rgraph.importRenderTarget(m_recontruction.m_rt);
  103. }
  104. else
  105. {
  106. m_runCtx.m_finalRt = rgraph.importRenderTarget(m_recontruction.m_rt, TextureUsageBit::SAMPLED_FRAGMENT);
  107. m_recontruction.m_rtImportedOnce = true;
  108. }
  109. m_runCtx.m_intermediateRts[WRITE] = rgraph.newRenderTarget(m_main.m_rtDescr);
  110. m_runCtx.m_intermediateRts[READ] = rgraph.newRenderTarget(m_main.m_rtDescr);
  111. // Create pass
  112. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("SSGI");
  113. rpass.setWork(
  114. [](RenderPassWorkContext& rgraphCtx) { static_cast<Ssgi*>(rgraphCtx.m_userData)->run(rgraphCtx); }, this,
  115. 0);
  116. rpass.newDependency({m_runCtx.m_intermediateRts[WRITE], TextureUsageBit::IMAGE_COMPUTE_WRITE});
  117. rpass.newDependency({m_runCtx.m_finalRt, TextureUsageBit::SAMPLED_COMPUTE});
  118. TextureSubresourceInfo hizSubresource;
  119. hizSubresource.m_firstMipmap = m_main.m_depthLod;
  120. rpass.newDependency({m_r->getDepthDownscale().getHiZRt(), TextureUsageBit::SAMPLED_COMPUTE, hizSubresource});
  121. rpass.newDependency({m_r->getGBuffer().getColorRt(2), TextureUsageBit::SAMPLED_COMPUTE});
  122. rpass.newDependency({m_r->getDownscaleBlur().getRt(), TextureUsageBit::SAMPLED_COMPUTE});
  123. rpass.newDependency({m_r->getMotionVectors().getMotionVectorsRt(), TextureUsageBit::SAMPLED_COMPUTE});
  124. rpass.newDependency({m_r->getMotionVectors().getRejectionFactorRt(), TextureUsageBit::SAMPLED_COMPUTE});
  125. }
  126. // Blur vertical
  127. {
  128. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("SSGI_blur_v");
  129. rpass.newDependency({m_runCtx.m_intermediateRts[WRITE], TextureUsageBit::SAMPLED_COMPUTE});
  130. rpass.newDependency({m_runCtx.m_intermediateRts[READ], TextureUsageBit::IMAGE_COMPUTE_WRITE});
  131. rpass.newDependency({m_r->getGBuffer().getColorRt(2), TextureUsageBit::SAMPLED_COMPUTE});
  132. rpass.newDependency({m_r->getGBuffer().getDepthRt(), TextureUsageBit::SAMPLED_COMPUTE});
  133. rpass.setWork(
  134. [](RenderPassWorkContext& rgraphCtx) { static_cast<Ssgi*>(rgraphCtx.m_userData)->runVBlur(rgraphCtx); },
  135. this, 0);
  136. }
  137. // Blur horizontal
  138. {
  139. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("SSGI_blur_h");
  140. rpass.newDependency({m_runCtx.m_intermediateRts[READ], TextureUsageBit::SAMPLED_COMPUTE});
  141. rpass.newDependency({m_runCtx.m_intermediateRts[WRITE], TextureUsageBit::IMAGE_COMPUTE_WRITE});
  142. rpass.newDependency({m_r->getGBuffer().getColorRt(2), TextureUsageBit::SAMPLED_COMPUTE});
  143. rpass.newDependency({m_r->getGBuffer().getDepthRt(), TextureUsageBit::SAMPLED_COMPUTE});
  144. rpass.setWork(
  145. [](RenderPassWorkContext& rgraphCtx) { static_cast<Ssgi*>(rgraphCtx.m_userData)->runHBlur(rgraphCtx); },
  146. this, 0);
  147. }
  148. // Reconstruction
  149. {
  150. ComputeRenderPassDescription& rpass = rgraph.newComputeRenderPass("SSGI_recon");
  151. rpass.newDependency({m_runCtx.m_intermediateRts[WRITE], TextureUsageBit::SAMPLED_COMPUTE});
  152. rpass.newDependency({m_runCtx.m_finalRt, TextureUsageBit::IMAGE_COMPUTE_WRITE});
  153. rpass.newDependency({m_r->getGBuffer().getDepthRt(), TextureUsageBit::SAMPLED_COMPUTE});
  154. rpass.newDependency({m_r->getGBuffer().getColorRt(2), TextureUsageBit::SAMPLED_COMPUTE});
  155. rpass.setWork(
  156. [](RenderPassWorkContext& rgraphCtx) {
  157. static_cast<Ssgi*>(rgraphCtx.m_userData)->runRecontruct(rgraphCtx);
  158. },
  159. this, 0);
  160. }
  161. }
  162. void Ssgi::run(RenderPassWorkContext& rgraphCtx)
  163. {
  164. RenderingContext& ctx = *m_runCtx.m_ctx;
  165. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  166. cmdb->bindShaderProgram(m_main.m_grProg[m_r->getFrameCount() % 4]);
  167. rgraphCtx.bindImage(0, 0, m_runCtx.m_intermediateRts[WRITE], TextureSubresourceInfo());
  168. // Bind uniforms
  169. SsgiUniforms* unis = allocateAndBindUniforms<SsgiUniforms*>(sizeof(SsgiUniforms), cmdb, 0, 1);
  170. unis->m_depthBufferSize = UVec2(m_r->getWidth(), m_r->getHeight()) >> (m_main.m_depthLod + 1);
  171. unis->m_framebufferSize = UVec2(m_r->getWidth(), m_r->getHeight());
  172. unis->m_invProjMat = ctx.m_matrices.m_projectionJitter.getInverse();
  173. unis->m_projMat = ctx.m_matrices.m_projectionJitter;
  174. unis->m_prevViewProjMatMulInvViewProjMat =
  175. ctx.m_prevMatrices.m_viewProjection * ctx.m_matrices.m_viewProjectionJitter.getInverse();
  176. unis->m_normalMat = Mat3x4(Vec3(0.0f), ctx.m_matrices.m_view.getRotationPart());
  177. unis->m_frameCount = m_r->getFrameCount() & MAX_U32;
  178. unis->m_maxSteps = m_main.m_maxSteps;
  179. unis->m_firstStepPixels = m_main.m_firstStepPixels;
  180. cmdb->bindSampler(0, 2, m_r->getSamplers().m_trilinearClamp);
  181. rgraphCtx.bindColorTexture(0, 3, m_r->getGBuffer().getColorRt(2));
  182. TextureSubresourceInfo hizSubresource;
  183. hizSubresource.m_firstMipmap = m_main.m_depthLod;
  184. rgraphCtx.bindTexture(0, 4, m_r->getDepthDownscale().getHiZRt(), hizSubresource);
  185. rgraphCtx.bindColorTexture(0, 5, m_r->getDownscaleBlur().getRt());
  186. rgraphCtx.bindColorTexture(0, 6, m_runCtx.m_finalRt);
  187. rgraphCtx.bindColorTexture(0, 7, m_r->getMotionVectors().getMotionVectorsRt());
  188. rgraphCtx.bindColorTexture(0, 8, m_r->getMotionVectors().getRejectionFactorRt());
  189. // Dispatch
  190. dispatchPPCompute(cmdb, 16, 16, m_r->getWidth() / 2, m_r->getHeight() / 2);
  191. }
  192. void Ssgi::runVBlur(RenderPassWorkContext& rgraphCtx)
  193. {
  194. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  195. cmdb->bindShaderProgram(m_denoise.m_grProg[0][m_r->getFrameCount() % 4]);
  196. cmdb->bindSampler(0, 0, m_r->getSamplers().m_trilinearClamp);
  197. rgraphCtx.bindColorTexture(0, 1, m_runCtx.m_intermediateRts[WRITE]);
  198. rgraphCtx.bindTexture(0, 2, m_r->getGBuffer().getDepthRt(), TextureSubresourceInfo(DepthStencilAspectBit::DEPTH));
  199. rgraphCtx.bindColorTexture(0, 3, m_r->getGBuffer().getColorRt(2));
  200. rgraphCtx.bindImage(0, 4, m_runCtx.m_intermediateRts[READ], TextureSubresourceInfo());
  201. const Mat4 mat = m_runCtx.m_ctx->m_matrices.m_viewProjectionJitter.getInverse();
  202. cmdb->setPushConstants(&mat, sizeof(mat));
  203. dispatchPPCompute(cmdb, 8, 8, m_r->getWidth() / 2, m_r->getHeight() / 2);
  204. }
  205. void Ssgi::runHBlur(RenderPassWorkContext& rgraphCtx)
  206. {
  207. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  208. cmdb->bindShaderProgram(m_denoise.m_grProg[1][m_r->getFrameCount() % 4]);
  209. cmdb->bindSampler(0, 0, m_r->getSamplers().m_trilinearClamp);
  210. rgraphCtx.bindColorTexture(0, 1, m_runCtx.m_intermediateRts[READ]);
  211. rgraphCtx.bindTexture(0, 2, m_r->getGBuffer().getDepthRt(), TextureSubresourceInfo(DepthStencilAspectBit::DEPTH));
  212. rgraphCtx.bindColorTexture(0, 3, m_r->getGBuffer().getColorRt(2));
  213. rgraphCtx.bindImage(0, 4, m_runCtx.m_intermediateRts[WRITE], TextureSubresourceInfo());
  214. const Mat4 mat = m_runCtx.m_ctx->m_matrices.m_viewProjectionJitter.getInverse();
  215. cmdb->setPushConstants(&mat, sizeof(mat));
  216. dispatchPPCompute(cmdb, 8, 8, m_r->getWidth() / 2, m_r->getHeight() / 2);
  217. }
  218. void Ssgi::runRecontruct(RenderPassWorkContext& rgraphCtx)
  219. {
  220. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  221. cmdb->bindShaderProgram(m_recontruction.m_grProg[m_r->getFrameCount() % 4]);
  222. cmdb->bindSampler(0, 0, m_r->getSamplers().m_trilinearClamp);
  223. rgraphCtx.bindColorTexture(0, 1, m_runCtx.m_intermediateRts[WRITE]);
  224. rgraphCtx.bindTexture(0, 2, m_r->getGBuffer().getDepthRt(), TextureSubresourceInfo(DepthStencilAspectBit::DEPTH));
  225. rgraphCtx.bindImage(0, 3, m_runCtx.m_finalRt, TextureSubresourceInfo());
  226. dispatchPPCompute(cmdb, 16, 16, m_r->getWidth(), m_r->getHeight());
  227. }
  228. } // end namespace anki