| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405 |
- // Copyright (C) 2009-2023, Panagiotis Christopoulos Charitos and contributors.
- // All rights reserved.
- // Code licensed under the BSD License.
- // http://www.anki3d.org/LICENSE
- #include <AnKi/Renderer/IndirectDiffuse.h>
- #include <AnKi/Renderer/Renderer.h>
- #include <AnKi/Renderer/DepthDownscale.h>
- #include <AnKi/Renderer/GBuffer.h>
- #include <AnKi/Renderer/DownscaleBlur.h>
- #include <AnKi/Renderer/MotionVectors.h>
- #include <AnKi/Renderer/IndirectDiffuseProbes.h>
- #include <AnKi/Renderer/ClusterBinning.h>
- #include <AnKi/Renderer/PackVisibleClusteredObjects.h>
- #include <AnKi/Core/ConfigSet.h>
- namespace anki {
- // Tweakables of the indirect diffuse pass. All of them are registered under CVarSubsystem::kRenderer.
- // NOTE(review): the three numbers after the name look like (default, min, max) - confirm against NumericCVar.
- //
- // Value forwarded to the main pass as IndirectDiffuseUniforms::m_sampleCount
- static NumericCVar<U32> g_indirectDiffuseSsgiSampleCountCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseSsgiSampleCount",
-     8, 1, 1024,
-     "SSGI sample count");
- // Value forwarded to the main pass as IndirectDiffuseUniforms::m_radius
- static NumericCVar<F32> g_indirectDiffuseSsgiRadiusCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseSsgiRadius",
-     2.0f, 0.1f, 100.0f,
-     "SSGI radius in meters");
- // The denoise passes consume this value halved and rounded, never less than 1
- static NumericCVar<U32> g_indirectDiffuseDenoiseSampleCountCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseDenoiseSampleCount",
-     4, 1, 128,
-     "Indirect diffuse denoise sample count");
- // Value forwarded to the main pass as IndirectDiffuseUniforms::m_ssaoStrength
- static NumericCVar<F32> g_indirectDiffuseSsaoStrengthCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseSsaoStrength",
-     2.5f, 0.1f, 10.0f,
-     "SSAO strength");
- // Value forwarded to the main pass as IndirectDiffuseUniforms::m_ssaoBias
- static NumericCVar<F32> g_indirectDiffuseSsaoBiasCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseSsaoBias",
-     -0.1f, -10.0f, 10.0f,
-     "SSAO bias");
- // Pushed to the VRS shading rate image generation shader
- static NumericCVar<F32> g_indirectDiffuseVrsDistanceThresholdCVar(
-     CVarSubsystem::kRenderer,
-     "IndirectDiffuseVrsDistanceThreshold",
-     0.01f, 0.00001f, 10.0f,
-     "The meters that control the VRS SRI generation");
- Error IndirectDiffuse::init()
- {
- const Error err = initInternal();
- if(err)
- {
- ANKI_R_LOGE("Failed to initialize indirect diffuse pass");
- }
- return err;
- }
- /// Creates everything the pass needs up front: the two half-resolution render targets, the optional VRS shading rate
- /// image resources and the shader programs of the main and the denoise passes.
- /// @return Error::kNone when everything loaded. A failing ANKI_CHECK leaves the function early
- ///         (NOTE(review): presumably forwarding the loader's error - confirm against the macro).
- Error IndirectDiffuse::initInternal()
- {
-     ANKI_ASSERT((getRenderer().getInternalResolution() % 2) == UVec2(0u) && "Needs to be dividable for proper upscaling");
-     // The whole pass works on half of the internal resolution
-     const UVec2 halfRez = getRenderer().getInternalResolution() / 2;
-     ANKI_R_LOGV("Initializing indirect diffuse. Resolution %ux%u", halfRez.x(), halfRez.y());
-     const Bool useCompute = g_preferComputeCVar.get();
-     const auto& gpuCaps = GrManager::getSingleton().getDeviceCapabilities();
-     // Render targets. They are always sampled; how they get written depends on the compute/raster choice
-     TextureUsageBit rtUsage = TextureUsageBit::kAllSampled;
-     if(useCompute)
-     {
-         rtUsage |= TextureUsageBit::kImageComputeWrite;
-     }
-     else
-     {
-         rtUsage |= TextureUsageBit::kFramebufferWrite;
-     }
-     // Both targets share one init info, only the name changes in between
-     TextureInitInfo rtInit =
-         getRenderer().create2DRenderTargetInitInfo(halfRez.x(), halfRez.y(), getRenderer().getHdrFormat(), rtUsage, "IndirectDiffuse #1");
-     m_rts[0] = getRenderer().createAndClearRenderTarget(rtInit, TextureUsageBit::kAllSampled);
-     rtInit.setName("IndirectDiffuse #2");
-     m_rts[1] = getRenderer().createAndClearRenderTarget(rtInit, TextureUsageBit::kAllSampled);
-     // The main pass needs a framebuffer description only when it rasterizes
-     if(!useCompute)
-     {
-         m_main.m_fbDescr.m_colorAttachmentCount = 1;
-         m_main.m_fbDescr.bake();
-     }
-     // VRS shading rate image (SRI) generation. Needs device support, the VRS CVar and the raster path
-     const Bool vrsOn = gpuCaps.m_vrs && g_vrsCVar.get() && !useCompute;
-     if(vrsOn)
-     {
-         m_vrs.m_sriTexelDimension = gpuCaps.m_minShadingRateImageTexelSize;
-         ANKI_ASSERT(m_vrs.m_sriTexelDimension == 8 || m_vrs.m_sriTexelDimension == 16);
-         // One SRI texel covers m_sriTexelDimension^2 pixels, round the SRI size up
-         const UVec2 sriRez = (halfRez + m_vrs.m_sriTexelDimension - 1) / m_vrs.m_sriTexelDimension;
-         m_vrs.m_rtHandle = getRenderer().create2DRenderTargetDescription(sriRez.x(), sriRez.y(), Format::kR8_Uint, "IndirectDiffuseVrsSri");
-         m_vrs.m_rtHandle.bake();
-         ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/IndirectDiffuseVrsSriGeneration.ankiprogbin", m_vrs.m_prog));
-         ShaderProgramResourceVariantInitInfo sriVariantInit(m_vrs.m_prog);
-         sriVariantInit.addMutation("SRI_TEXEL_DIMENSION", m_vrs.m_sriTexelDimension);
-         // The algorithm's workgroup size is 32 for a 16 texel SRI and 16 for an 8 texel SRI. If the GPU's minimum subgroup
-         // size is at least that big then each workgroup has 1 subgroup and there is no need for shared mem
-         const Bool oneSubgroupPerWorkgroup = (m_vrs.m_sriTexelDimension == 16 && gpuCaps.m_minSubgroupSize >= 32)
-                                              || (m_vrs.m_sriTexelDimension == 8 && gpuCaps.m_minSubgroupSize >= 16);
-         sriVariantInit.addMutation("SHARED_MEMORY", (oneSubgroupPerWorkgroup) ? 0 : 1);
-         sriVariantInit.addMutation("LIMIT_RATE_TO_2X2", g_vrsLimitTo2x2CVar.get());
-         const ShaderProgramResourceVariant* sriVariant = nullptr;
-         m_vrs.m_prog->getOrCreateVariant(sriVariantInit, sriVariant);
-         m_vrs.m_grProg.reset(&sriVariant->getProgram());
-         // Program that getDebugRenderTarget() hands out together with the SRI
-         ANKI_CHECK(ResourceManager::getSingleton().loadResource("ShaderBinaries/VrsSriVisualizeRenderTarget.ankiprogbin", m_vrs.m_visualizeProg));
-         const ShaderProgramResourceVariant* visualizeVariant = nullptr;
-         m_vrs.m_visualizeProg->getOrCreateVariant(visualizeVariant);
-         m_vrs.m_visualizeGrProg.reset(&visualizeVariant->getProgram());
-     }
-     // SSGI+probes program
-     {
-         const CString mainProgFname =
-             (useCompute) ? "ShaderBinaries/IndirectDiffuseCompute.ankiprogbin" : "ShaderBinaries/IndirectDiffuseRaster.ankiprogbin";
-         ANKI_CHECK(ResourceManager::getSingleton().loadResource(mainProgFname, m_main.m_prog));
-         const ShaderProgramResourceVariant* mainVariant = nullptr;
-         m_main.m_prog->getOrCreateVariant(mainVariant);
-         m_main.m_grProg.reset(&mainVariant->getProgram());
-     }
-     // Denoise program, one variant per value of BLUR_ORIENTATION
-     {
-         m_denoise.m_fbDescr.m_colorAttachmentCount = 1;
-         m_denoise.m_fbDescr.bake();
-         const CString denoiseProgFname =
-             (useCompute) ? "ShaderBinaries/IndirectDiffuseDenoiseCompute.ankiprogbin" : "ShaderBinaries/IndirectDiffuseDenoiseRaster.ankiprogbin";
-         ANKI_CHECK(ResourceManager::getSingleton().loadResource(denoiseProgFname, m_denoise.m_prog));
-         ShaderProgramResourceVariantInitInfo denoiseVariantInit(m_denoise.m_prog);
-         for(U32 orientation = 0; orientation < 2; ++orientation)
-         {
-             denoiseVariantInit.addMutation("BLUR_ORIENTATION", orientation);
-             const ShaderProgramResourceVariant* denoiseVariant = nullptr;
-             m_denoise.m_prog->getOrCreateVariant(denoiseVariantInit, denoiseVariant);
-             m_denoise.m_grProgs[orientation].reset(&denoiseVariant->getProgram());
-         }
-     }
-     return Error::kNone;
- }
- /// Registers this frame's indirect diffuse work in the render graph: an optional compute pass that generates the VRS
- /// shading rate image, the main "IndirectDiffuse" pass and two denoise passes that ping-pong between the two render
- /// targets. Every pass is recorded as compute or as graphics depending on g_preferComputeCVar.
- /// @param ctx Per-frame context. Supplies the render graph description and the matrices. The work callbacks capture
- ///            it by reference.
- void IndirectDiffuse::populateRenderGraph(RenderingContext& ctx)
- {
-     RenderGraphDescription& graph = ctx.m_renderGraphDescr;
-     const Bool useCompute = g_preferComputeCVar.get();
-     const Bool vrsOn = GrManager::getSingleton().getDeviceCapabilities().m_vrs && g_vrsCVar.get() && !useCompute;
-     // Keep the main framebuffer description in sync with the VRS state. A non-zero texel width means that it was baked
-     // with a shading rate attachment
-     const Bool fbBakedWithVrs = m_main.m_fbDescr.m_shadingRateAttachmentTexelWidth > 0;
-     if(!useCompute && vrsOn != fbBakedWithVrs)
-     {
-         if(!vrsOn)
-         {
-             m_main.m_fbDescr.m_shadingRateAttachmentTexelWidth = 0;
-             m_main.m_fbDescr.m_shadingRateAttachmentTexelHeight = 0;
-         }
-         else
-         {
-             m_main.m_fbDescr.m_shadingRateAttachmentTexelWidth = m_vrs.m_sriTexelDimension;
-             m_main.m_fbDescr.m_shadingRateAttachmentTexelHeight = m_vrs.m_sriTexelDimension;
-         }
-         m_main.m_fbDescr.bake();
-     }
-     // Shading rate image generation
-     if(vrsOn)
-     {
-         m_runCtx.m_sriRt = graph.newRenderTarget(m_vrs.m_rtHandle);
-         ComputeRenderPassDescription& sriPass = graph.newComputeRenderPass("IndirectDiffuse VRS SRI gen");
-         sriPass.newTextureDependency(m_runCtx.m_sriRt, TextureUsageBit::kImageComputeWrite);
-         sriPass.newTextureDependency(getRenderer().getDepthDownscale().getHiZRt(), TextureUsageBit::kSampledCompute, kHiZHalfSurface);
-         sriPass.setWork([this, &ctx](RenderPassWorkContext& rgraphCtx) {
-             CommandBuffer& cmd = *rgraphCtx.m_commandBuffer;
-             cmd.bindShaderProgram(m_vrs.m_grProg.get());
-             rgraphCtx.bindTexture(0, 0, getRenderer().getDepthDownscale().getHiZRt(), kHiZHalfSurface);
-             cmd.bindSampler(0, 1, getRenderer().getSamplers().m_nearestNearestClamp.get());
-             rgraphCtx.bindImage(0, 2, m_runCtx.m_sriRt);
-             const UVec2 halfRez = getRenderer().getInternalResolution() / 2u;
-             // Push constants: xy holds 1/viewport, z holds the distance threshold, w is unused
-             struct
-             {
-                 Vec4 m_v4;
-                 Mat4 m_invertedProjectionJitter;
-             } consts;
-             consts.m_v4 = Vec4(1.0f / Vec2(halfRez), g_indirectDiffuseVrsDistanceThresholdCVar.get(), 0.0f);
-             consts.m_invertedProjectionJitter = ctx.m_matrices.m_invertedProjectionJitter;
-             cmd.setPushConstants(&consts, sizeof(consts));
-             dispatchPPCompute(cmd, m_vrs.m_sriTexelDimension, m_vrs.m_sriTexelDimension, halfRez.x(), halfRez.y());
-         });
-     }
-     // SSGI+probes
-     {
-         // The 2 render targets swap the read/write roles every frame
-         const U32 readRtIdx = getRenderer().getFrameCount() & 1;
-         const U32 writeRtIdx = !readRtIdx;
-         if(!m_rtsImportedOnce) [[unlikely]]
-         {
-             // Very first import, pass the usage the textures were created and cleared with
-             m_runCtx.m_mainRtHandles[0] = graph.importRenderTarget(m_rts[readRtIdx].get(), TextureUsageBit::kAllSampled);
-             m_runCtx.m_mainRtHandles[1] = graph.importRenderTarget(m_rts[writeRtIdx].get(), TextureUsageBit::kAllSampled);
-             m_rtsImportedOnce = true;
-         }
-         else
-         {
-             m_runCtx.m_mainRtHandles[0] = graph.importRenderTarget(m_rts[readRtIdx].get());
-             m_runCtx.m_mainRtHandles[1] = graph.importRenderTarget(m_rts[writeRtIdx].get());
-         }
-         // Create the pass and choose the usages that match its type
-         RenderPassDescriptionBase* mainPass;
-         TextureUsageBit sampleUsage;
-         TextureUsageBit outputUsage;
-         if(!useCompute)
-         {
-             GraphicsRenderPassDescription& gfxPass = graph.newGraphicsRenderPass("IndirectDiffuse");
-             gfxPass.setFramebufferInfo(m_main.m_fbDescr, {m_runCtx.m_mainRtHandles[kWrite]}, {}, (vrsOn) ? m_runCtx.m_sriRt : RenderTargetHandle());
-             sampleUsage = TextureUsageBit::kSampledFragment;
-             outputUsage = TextureUsageBit::kFramebufferWrite;
-             mainPass = &gfxPass;
-             if(vrsOn)
-             {
-                 mainPass->newTextureDependency(m_runCtx.m_sriRt, TextureUsageBit::kFramebufferShadingRate);
-             }
-         }
-         else
-         {
-             ComputeRenderPassDescription& computePass = graph.newComputeRenderPass("IndirectDiffuse");
-             sampleUsage = TextureUsageBit::kSampledCompute;
-             outputUsage = TextureUsageBit::kImageComputeWrite;
-             mainPass = &computePass;
-         }
-         // Dependencies
-         mainPass->newTextureDependency(m_runCtx.m_mainRtHandles[kWrite], outputUsage);
-         if(getRenderer().getIndirectDiffuseProbes().hasCurrentlyRefreshedVolumeRt())
-         {
-             mainPass->newTextureDependency(getRenderer().getIndirectDiffuseProbes().getCurrentlyRefreshedVolumeRt(), sampleUsage);
-         }
-         mainPass->newTextureDependency(getRenderer().getGBuffer().getColorRt(2), sampleUsage);
-         // Only a single mip of the HiZ is consumed
-         TextureSubresourceInfo hizSingleMip;
-         hizSingleMip.m_mipmapCount = 1;
-         mainPass->newTextureDependency(getRenderer().getDepthDownscale().getHiZRt(), sampleUsage, hizSingleMip);
-         mainPass->newTextureDependency(getRenderer().getDownscaleBlur().getRt(), sampleUsage);
-         mainPass->newTextureDependency(getRenderer().getMotionVectors().getMotionVectorsRt(), sampleUsage);
-         mainPass->newTextureDependency(getRenderer().getMotionVectors().getHistoryLengthRt(), sampleUsage);
-         mainPass->newTextureDependency(m_runCtx.m_mainRtHandles[kRead], sampleUsage);
-         mainPass->setWork([this, &ctx, vrsOn](RenderPassWorkContext& rgraphCtx) {
-             CommandBuffer& cmd = *rgraphCtx.m_commandBuffer;
-             cmd.bindShaderProgram(m_main.m_grProg.get());
-             // Set 0: clustered shading data, sampler and the input textures
-             bindUniforms(cmd, 0, 0, getRenderer().getClusterBinning().getClusteredUniformsRebarToken());
-             getRenderer().getPackVisibleClusteredObjects().bindClusteredObjectBuffer(cmd, 0, 1, ClusteredObjectType::kGlobalIlluminationProbe);
-             bindStorage(cmd, 0, 2, getRenderer().getClusterBinning().getClustersRebarToken());
-             cmd.bindSampler(0, 3, getRenderer().getSamplers().m_trilinearClamp.get());
-             rgraphCtx.bindColorTexture(0, 4, getRenderer().getGBuffer().getColorRt(2));
-             TextureSubresourceInfo hizSingleMip;
-             hizSingleMip.m_mipmapCount = 1;
-             rgraphCtx.bindTexture(0, 5, getRenderer().getDepthDownscale().getHiZRt(), hizSingleMip);
-             rgraphCtx.bindColorTexture(0, 6, getRenderer().getDownscaleBlur().getRt());
-             rgraphCtx.bindColorTexture(0, 7, m_runCtx.m_mainRtHandles[kRead]);
-             rgraphCtx.bindColorTexture(0, 8, getRenderer().getMotionVectors().getMotionVectorsRt());
-             rgraphCtx.bindColorTexture(0, 9, getRenderer().getMotionVectors().getHistoryLengthRt());
-             if(g_preferComputeCVar.get())
-             {
-                 // Compute writes the output through an image binding instead of a framebuffer
-                 rgraphCtx.bindImage(0, 10, m_runCtx.m_mainRtHandles[kWrite]);
-             }
-             // Set 1: bindless
-             cmd.bindAllBindless(1);
-             // Push constants
-             IndirectDiffuseUniforms consts;
-             consts.m_viewportSize = getRenderer().getInternalResolution() / 2u;
-             consts.m_viewportSizef = Vec2(consts.m_viewportSize);
-             const Mat4& proj = ctx.m_matrices.m_projection;
-             consts.m_projectionMat = Vec4(proj(0, 0), proj(1, 1), proj(2, 2), proj(2, 3));
-             consts.m_radius = g_indirectDiffuseSsgiRadiusCVar.get();
-             consts.m_sampleCount = g_indirectDiffuseSsgiSampleCountCVar.get();
-             consts.m_sampleCountf = F32(consts.m_sampleCount);
-             consts.m_ssaoBias = g_indirectDiffuseSsaoBiasCVar.get();
-             consts.m_ssaoStrength = g_indirectDiffuseSsaoStrengthCVar.get();
-             cmd.setPushConstants(&consts, sizeof(consts));
-             // Kick the work
-             if(g_preferComputeCVar.get())
-             {
-                 dispatchPPCompute(cmd, 8, 8, consts.m_viewportSize.x(), consts.m_viewportSize.y());
-             }
-             else
-             {
-                 cmd.setViewport(0, 0, consts.m_viewportSize.x(), consts.m_viewportSize.y());
-                 if(vrsOn)
-                 {
-                     cmd.setVrsRate(VrsRate::k1x1);
-                 }
-                 cmd.draw(PrimitiveTopology::kTriangles, 3);
-             }
-         });
-     }
-     // Denoise. The 1st pass reads what the main pass wrote and writes the other target, the 2nd pass goes the opposite
-     // way. The end result lands in the kWrite target
-     for(U32 dir = 0; dir < 2; ++dir)
-     {
-         const U32 readIdx = (dir == 0) ? kWrite : kRead;
-         const CString passName = (dir == 0) ? "IndirectDiffuseDenoiseH" : "IndirectDiffuseDenoiseV";
-         RenderPassDescriptionBase* denoisePass;
-         TextureUsageBit sampleUsage;
-         TextureUsageBit outputUsage;
-         if(!useCompute)
-         {
-             GraphicsRenderPassDescription& gfxPass = graph.newGraphicsRenderPass(passName);
-             gfxPass.setFramebufferInfo(m_denoise.m_fbDescr, {m_runCtx.m_mainRtHandles[!readIdx]});
-             sampleUsage = TextureUsageBit::kSampledFragment;
-             outputUsage = TextureUsageBit::kFramebufferWrite;
-             denoisePass = &gfxPass;
-         }
-         else
-         {
-             ComputeRenderPassDescription& computePass = graph.newComputeRenderPass(passName);
-             sampleUsage = TextureUsageBit::kSampledCompute;
-             outputUsage = TextureUsageBit::kImageComputeWrite;
-             denoisePass = &computePass;
-         }
-         denoisePass->newTextureDependency(m_runCtx.m_mainRtHandles[readIdx], sampleUsage);
-         TextureSubresourceInfo hizSingleMip;
-         hizSingleMip.m_mipmapCount = 1;
-         denoisePass->newTextureDependency(getRenderer().getDepthDownscale().getHiZRt(), sampleUsage, hizSingleMip);
-         denoisePass->newTextureDependency(m_runCtx.m_mainRtHandles[!readIdx], outputUsage);
-         denoisePass->setWork([this, &ctx, dir, readIdx](RenderPassWorkContext& rgraphCtx) {
-             CommandBuffer& cmd = *rgraphCtx.m_commandBuffer;
-             // dir selects the BLUR_ORIENTATION variant
-             cmd.bindShaderProgram(m_denoise.m_grProgs[dir].get());
-             cmd.bindSampler(0, 0, getRenderer().getSamplers().m_trilinearClamp.get());
-             rgraphCtx.bindColorTexture(0, 1, m_runCtx.m_mainRtHandles[readIdx]);
-             TextureSubresourceInfo hizSingleMip;
-             hizSingleMip.m_mipmapCount = 1;
-             rgraphCtx.bindTexture(0, 2, getRenderer().getDepthDownscale().getHiZRt(), hizSingleMip);
-             if(g_preferComputeCVar.get())
-             {
-                 rgraphCtx.bindImage(0, 3, m_runCtx.m_mainRtHandles[!readIdx]);
-             }
-             // Push constants
-             IndirectDiffuseDenoiseUniforms consts;
-             consts.m_invertedViewProjectionJitterMat = ctx.m_matrices.m_invertedViewProjectionJitter;
-             consts.m_viewportSize = getRenderer().getInternalResolution() / 2u;
-             consts.m_viewportSizef = Vec2(consts.m_viewportSize);
-             // Half of the configured sample count, rounded, but never less than 1
-             consts.m_sampleCountDiv2 = F32(g_indirectDiffuseDenoiseSampleCountCVar.get());
-             consts.m_sampleCountDiv2 = max(1.0f, std::round(consts.m_sampleCountDiv2 / 2.0f));
-             cmd.setPushConstants(&consts, sizeof(consts));
-             if(g_preferComputeCVar.get())
-             {
-                 dispatchPPCompute(cmd, 8, 8, consts.m_viewportSize.x(), consts.m_viewportSize.y());
-             }
-             else
-             {
-                 cmd.setViewport(0, 0, consts.m_viewportSize.x(), consts.m_viewportSize.y());
-                 cmd.draw(PrimitiveTopology::kTriangles, 3);
-             }
-         });
-     }
- }
- /// Hands out one of the pass's render targets for debug visualization.
- /// @param rtName "IndirectDiffuse" selects the kWrite render target handle. Any other name is asserted to be
- ///               "IndirectDiffuseVrsSri" and selects the VRS shading rate image.
- /// @param[out] handles Only element 0 is written.
- /// @param[out] optionalShaderProgram Set to the SRI visualization program for the VRS target, left untouched otherwise.
- void IndirectDiffuse::getDebugRenderTarget(CString rtName, Array<RenderTargetHandle, kMaxDebugRenderTargets>& handles,
-                                            ShaderProgramPtr& optionalShaderProgram) const
- {
-     const Bool wantsMainRt = (rtName == "IndirectDiffuse");
-     if(!wantsMainRt)
-     {
-         ANKI_ASSERT(rtName == "IndirectDiffuseVrsSri");
-         handles[0] = m_runCtx.m_sriRt;
-         optionalShaderProgram = m_vrs.m_visualizeGrProg;
-         return;
-     }
-     handles[0] = m_runCtx.m_mainRtHandles[kWrite];
- }
- } // end namespace anki
|