VrsSriGeneration.cpp 6.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197
  1. // Copyright (C) 2009-2022, Panagiotis Christopoulos Charitos and contributors.
  2. // All rights reserved.
  3. // Code licensed under the BSD License.
  4. // http://www.anki3d.org/LICENSE
  5. #include <AnKi/Renderer/VrsSriGeneration.h>
  6. #include <AnKi/Renderer/Renderer.h>
  7. #include <AnKi/Renderer/LightShading.h>
  8. #include <AnKi/Core/ConfigSet.h>
  9. namespace anki {
  10. VrsSriGeneration::VrsSriGeneration(Renderer* r)
  11. : RendererObject(r)
  12. {
  13. registerDebugRenderTarget("VrsSri");
  14. registerDebugRenderTarget("VrsSriDownscaled");
  15. }
  16. VrsSriGeneration::~VrsSriGeneration()
  17. {
  18. }
  19. Error VrsSriGeneration::init()
  20. {
  21. const Error err = initInternal();
  22. if(err)
  23. {
  24. ANKI_R_LOGE("Failed to initialize VRS SRI generation");
  25. }
  26. return err;
  27. }
  28. Error VrsSriGeneration::initInternal()
  29. {
  30. if(!getGrManager().getDeviceCapabilities().m_vrs)
  31. {
  32. return Error::NONE;
  33. }
  34. m_sriTexelDimension = getGrManager().getDeviceCapabilities().m_minShadingRateImageTexelSize;
  35. ANKI_ASSERT(m_sriTexelDimension == 8 || m_sriTexelDimension == 16);
  36. const UVec2 rez = (m_r->getInternalResolution() + m_sriTexelDimension - 1) / m_sriTexelDimension;
  37. ANKI_R_LOGV("Intializing VRS SRI generation. SRI resolution %ux%u", rez.x(), rez.y());
  38. // Create textures
  39. const TextureUsageBit texUsage =
  40. TextureUsageBit::FRAMEBUFFER_SHADING_RATE | TextureUsageBit::IMAGE_COMPUTE_WRITE | TextureUsageBit::ALL_SAMPLED;
  41. TextureInitInfo sriInitInfo =
  42. m_r->create2DRenderTargetInitInfo(rez.x(), rez.y(), Format::R8_UINT, texUsage, "VrsSri");
  43. m_sriTex = m_r->createAndClearRenderTarget(sriInitInfo, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  44. const UVec2 rezDownscaled = (m_r->getInternalResolution() / 2 + m_sriTexelDimension - 1) / m_sriTexelDimension;
  45. sriInitInfo = m_r->create2DRenderTargetInitInfo(rezDownscaled.x(), rezDownscaled.y(), Format::R8_UINT, texUsage,
  46. "VrsSriDownscaled");
  47. m_downscaledSriTex = m_r->createAndClearRenderTarget(sriInitInfo, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  48. // Load programs
  49. ANKI_CHECK(getResourceManager().loadResource("ShaderBinaries/VrsSriGenerationCompute.ankiprogbin", m_prog));
  50. ShaderProgramResourceVariantInitInfo variantInit(m_prog);
  51. variantInit.addMutation("SRI_TEXEL_DIMENSION", m_sriTexelDimension);
  52. if(m_sriTexelDimension == 16 && getGrManager().getDeviceCapabilities().m_minSubgroupSize >= 32)
  53. {
  54. // Algorithm's workgroup size is 32, GPU's subgroup size is min 32 -> each workgroup has 1 subgroup -> No need
  55. // for shared mem
  56. variantInit.addMutation("SHARED_MEMORY", 0);
  57. }
  58. else if(m_sriTexelDimension == 8 && getGrManager().getDeviceCapabilities().m_minSubgroupSize >= 16)
  59. {
  60. // Algorithm's workgroup size is 16, GPU's subgroup size is min 16 -> each workgroup has 1 subgroup -> No need
  61. // for shared mem
  62. variantInit.addMutation("SHARED_MEMORY", 0);
  63. }
  64. else
  65. {
  66. variantInit.addMutation("SHARED_MEMORY", 1);
  67. }
  68. variantInit.addMutation("LIMIT_RATE_TO_2X2", getConfig().getRVrsLimitTo2x2());
  69. const ShaderProgramResourceVariant* variant;
  70. m_prog->getOrCreateVariant(variantInit, variant);
  71. m_grProg = variant->getProgram();
  72. ANKI_CHECK(
  73. getResourceManager().loadResource("ShaderBinaries/VrsSriVisualizeRenderTarget.ankiprogbin", m_visualizeProg));
  74. m_visualizeProg->getOrCreateVariant(variant);
  75. m_visualizeGrProg = variant->getProgram();
  76. ANKI_CHECK(getResourceManager().loadResource("ShaderBinaries/VrsSriDownscale.ankiprogbin", m_downscaleProg));
  77. m_downscaleProg->getOrCreateVariant(variant);
  78. m_downscaleGrProg = variant->getProgram();
  79. return Error::NONE;
  80. }
  81. void VrsSriGeneration::getDebugRenderTarget(CString rtName, RenderTargetHandle& handle,
  82. ShaderProgramPtr& optionalShaderProgram) const
  83. {
  84. if(rtName == "VrsSri")
  85. {
  86. handle = m_runCtx.m_rt;
  87. }
  88. else
  89. {
  90. ANKI_ASSERT(rtName == "VrsSriDownscaled");
  91. handle = m_runCtx.m_downscaledRt;
  92. }
  93. optionalShaderProgram = m_visualizeGrProg;
  94. }
  95. void VrsSriGeneration::importRenderTargets(RenderingContext& ctx)
  96. {
  97. const Bool enableVrs = getGrManager().getDeviceCapabilities().m_vrs && getConfig().getRVrs();
  98. if(!enableVrs)
  99. {
  100. return;
  101. }
  102. if(m_sriTexImportedOnce)
  103. {
  104. m_runCtx.m_rt = ctx.m_renderGraphDescr.importRenderTarget(m_sriTex);
  105. m_runCtx.m_downscaledRt = ctx.m_renderGraphDescr.importRenderTarget(m_downscaledSriTex);
  106. }
  107. else
  108. {
  109. m_runCtx.m_rt = ctx.m_renderGraphDescr.importRenderTarget(m_sriTex, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  110. m_runCtx.m_downscaledRt =
  111. ctx.m_renderGraphDescr.importRenderTarget(m_downscaledSriTex, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  112. m_sriTexImportedOnce = true;
  113. }
  114. }
  115. void VrsSriGeneration::populateRenderGraph(RenderingContext& ctx)
  116. {
  117. const Bool enableVrs = getGrManager().getDeviceCapabilities().m_vrs && getConfig().getRVrs();
  118. if(!enableVrs)
  119. {
  120. return;
  121. }
  122. RenderGraphDescription& rgraph = ctx.m_renderGraphDescr;
  123. // SRI generation
  124. {
  125. ComputeRenderPassDescription& pass = rgraph.newComputeRenderPass("VRS SRI generation");
  126. pass.newDependency(RenderPassDependency(m_runCtx.m_rt, TextureUsageBit::IMAGE_COMPUTE_WRITE));
  127. pass.newDependency(RenderPassDependency(m_r->getLightShading().getRt(), TextureUsageBit::SAMPLED_COMPUTE));
  128. pass.setWork([this](RenderPassWorkContext& rgraphCtx) {
  129. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  130. cmdb->bindShaderProgram(m_grProg);
  131. rgraphCtx.bindColorTexture(0, 0, m_r->getLightShading().getRt());
  132. cmdb->bindSampler(0, 1, m_r->getSamplers().m_nearestNearestClamp);
  133. rgraphCtx.bindImage(0, 2, m_runCtx.m_rt);
  134. const Vec4 pc(1.0f / Vec2(m_r->getInternalResolution()), getConfig().getRVrsThreshold(), 0.0f);
  135. cmdb->setPushConstants(&pc, sizeof(pc));
  136. const U32 fakeWorkgroupSizeXorY = m_sriTexelDimension;
  137. dispatchPPCompute(cmdb, fakeWorkgroupSizeXorY, fakeWorkgroupSizeXorY, m_r->getInternalResolution().x(),
  138. m_r->getInternalResolution().y());
  139. });
  140. }
  141. // Downscale
  142. {
  143. ComputeRenderPassDescription& pass = rgraph.newComputeRenderPass("VRS SRI downscale");
  144. pass.newDependency(RenderPassDependency(m_runCtx.m_rt, TextureUsageBit::SAMPLED_COMPUTE));
  145. pass.newDependency(RenderPassDependency(m_runCtx.m_downscaledRt, TextureUsageBit::IMAGE_COMPUTE_WRITE));
  146. pass.setWork([this](RenderPassWorkContext& rgraphCtx) {
  147. const UVec2 rezDownscaled =
  148. (m_r->getInternalResolution() / 2 + m_sriTexelDimension - 1) / m_sriTexelDimension;
  149. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  150. cmdb->bindShaderProgram(m_downscaleGrProg);
  151. rgraphCtx.bindColorTexture(0, 0, m_runCtx.m_rt);
  152. cmdb->bindSampler(0, 1, m_r->getSamplers().m_nearestNearestClamp);
  153. rgraphCtx.bindImage(0, 2, m_runCtx.m_downscaledRt);
  154. const Vec4 pc(1.0f / Vec2(rezDownscaled), 0.0f, 0.0f);
  155. cmdb->setPushConstants(&pc, sizeof(pc));
  156. dispatchPPCompute(cmdb, 8, 8, rezDownscaled.x(), rezDownscaled.y());
  157. });
  158. }
  159. }
  160. } // end namespace anki