VrsSriGeneration.cpp 4.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142
  1. // Copyright (C) 2009-2022, Panagiotis Christopoulos Charitos and contributors.
  2. // All rights reserved.
  3. // Code licensed under the BSD License.
  4. // http://www.anki3d.org/LICENSE
  5. #include <AnKi/Renderer/VrsSriGeneration.h>
  6. #include <AnKi/Renderer/Renderer.h>
  7. #include <AnKi/Renderer/TemporalAA.h>
  8. #include <AnKi/Core/ConfigSet.h>
  9. namespace anki {
  10. VrsSriGeneration::VrsSriGeneration(Renderer* r)
  11. : RendererObject(r)
  12. {
  13. registerDebugRenderTarget("VRS");
  14. }
  15. VrsSriGeneration::~VrsSriGeneration()
  16. {
  17. }
  18. Error VrsSriGeneration::init()
  19. {
  20. const Error err = initInternal();
  21. if(err)
  22. {
  23. ANKI_R_LOGE("Failed to initialize VRS SRI generation");
  24. }
  25. return err;
  26. }
  27. Error VrsSriGeneration::initInternal()
  28. {
  29. if(!getGrManager().getDeviceCapabilities().m_vrs)
  30. {
  31. return Error::NONE;
  32. }
  33. const UVec2 rez = (m_r->getInternalResolution() + m_sriTexelDimension - 1) / m_sriTexelDimension;
  34. ANKI_R_LOGV("Intializing VRS SRI generation. SRI resolution %ux%u", rez.x(), rez.y());
  35. // SRI
  36. const TextureUsageBit texUsage = TextureUsageBit::FRAMEBUFFER_SHADING_RATE | TextureUsageBit::IMAGE_COMPUTE_WRITE
  37. | TextureUsageBit::SAMPLED_FRAGMENT;
  38. TextureInitInfo sriInitInfo =
  39. m_r->create2DRenderTargetInitInfo(rez.x(), rez.y(), Format::R8_UINT, texUsage, "VRS SRI");
  40. m_sriTex = m_r->createAndClearRenderTarget(sriInitInfo, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  41. // Descr
  42. m_fbDescr.m_colorAttachmentCount = 1;
  43. m_fbDescr.bake();
  44. // Load programs
  45. ANKI_CHECK(getResourceManager().loadResource("ShaderBinaries/VrsSriGenerationCompute.ankiprogbin", m_prog));
  46. ShaderProgramResourceVariantInitInfo variantInit(m_prog);
  47. variantInit.addMutation("SRI_TEXEL_DIMENSION", m_sriTexelDimension);
  48. if(m_sriTexelDimension == 16 && getGrManager().getDeviceCapabilities().m_minSubgroupSize >= 32)
  49. {
  50. // Algorithm's workgroup size is 32, GPU's subgroup size is min 32 -> each workgroup has 1 subgroup -> No need
  51. // for shared mem
  52. variantInit.addMutation("SHARED_MEMORY", 0);
  53. }
  54. else
  55. {
  56. variantInit.addMutation("SHARED_MEMORY", 1);
  57. }
  58. const ShaderProgramResourceVariant* variant;
  59. m_prog->getOrCreateVariant(variantInit, variant);
  60. m_grProg = variant->getProgram();
  61. ANKI_CHECK(
  62. getResourceManager().loadResource("ShaderBinaries/VrsSriVisualizeRenderTarget.ankiprogbin", m_visualizeProg));
  63. m_visualizeProg->getOrCreateVariant(variant);
  64. m_visualizeGrProg = variant->getProgram();
  65. return Error::NONE;
  66. }
  67. void VrsSriGeneration::getDebugRenderTarget(CString rtName, RenderTargetHandle& handle,
  68. ShaderProgramPtr& optionalShaderProgram) const
  69. {
  70. ANKI_ASSERT(rtName == "VRS");
  71. handle = m_runCtx.m_rt;
  72. optionalShaderProgram = m_visualizeGrProg;
  73. }
  74. void VrsSriGeneration::importRenderTargets(RenderingContext& ctx)
  75. {
  76. const Bool enableVrs = getGrManager().getDeviceCapabilities().m_vrs && getConfig().getRVrs();
  77. if(!enableVrs)
  78. {
  79. return;
  80. }
  81. if(m_sriTexImportedOnce)
  82. {
  83. m_runCtx.m_rt = ctx.m_renderGraphDescr.importRenderTarget(m_sriTex);
  84. }
  85. else
  86. {
  87. m_runCtx.m_rt = ctx.m_renderGraphDescr.importRenderTarget(m_sriTex, TextureUsageBit::FRAMEBUFFER_SHADING_RATE);
  88. m_sriTexImportedOnce = true;
  89. }
  90. }
  91. void VrsSriGeneration::populateRenderGraph(RenderingContext& ctx)
  92. {
  93. const Bool enableVrs = getGrManager().getDeviceCapabilities().m_vrs && getConfig().getRVrs();
  94. if(!enableVrs)
  95. {
  96. return;
  97. }
  98. RenderGraphDescription& rgraph = ctx.m_renderGraphDescr;
  99. ComputeRenderPassDescription& pass = rgraph.newComputeRenderPass("VRS SRI generation");
  100. pass.newDependency(RenderPassDependency(m_runCtx.m_rt, TextureUsageBit::IMAGE_COMPUTE_WRITE));
  101. pass.newDependency(RenderPassDependency(m_r->getTemporalAA().getTonemappedRt(), TextureUsageBit::SAMPLED_COMPUTE));
  102. pass.setWork([this](RenderPassWorkContext& rgraphCtx) {
  103. CommandBufferPtr& cmdb = rgraphCtx.m_commandBuffer;
  104. cmdb->bindShaderProgram(m_grProg);
  105. rgraphCtx.bindColorTexture(0, 0, m_r->getTemporalAA().getTonemappedRt());
  106. cmdb->bindSampler(0, 1, m_r->getSamplers().m_nearestNearestClamp);
  107. rgraphCtx.bindImage(0, 2, m_runCtx.m_rt);
  108. const Vec4 pc(1.0f / Vec2(m_r->getInternalResolution()), getConfig().getRVrsThreshold(), 0.0f);
  109. cmdb->setPushConstants(&pc, sizeof(pc));
  110. const U32 fakeWorkgroupSizeXorY = m_sriTexelDimension;
  111. dispatchPPCompute(cmdb, fakeWorkgroupSizeXorY, fakeWorkgroupSizeXorY, m_r->getInternalResolution().x(),
  112. m_r->getInternalResolution().y());
  113. });
  114. }
  115. } // end namespace anki