cpp
/
BansheeEngine
mirror da https://github.com/larioteo/BansheeEngine.git


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199
							#include "$ENGINE$\DepthOfFieldCommon.bslinc"
#include "$ENGINE$\PerCameraData.bslinc"

shader PPBokehDOF
{
	mixin DepthOfFieldCommon;
	mixin PerCameraData;

	// Declares the DEPTH_OCCLUSION permutation (true / false). The code below tests it with #if to add
	// the per-sprite depth outputs in the vertex stage and the depth-based fade in the fragment stage.
	variations
	{
		DEPTH_OCCLUSION = { true, false };
	};
	
	// Depth state for this pass: both depth writes and depth reads are turned off.
	depth
	{
		write = false;
		read = false;
	};
	
	// Blending is enabled with { one, one, add } for both color and alpha.
	// NOTE(review): presumably the triple is (source factor, destination factor, operation), i.e. purely
	// additive accumulation of overlapping sprites -- confirm against the BSL manual.
	blend
	{
		target	
		{
			enabled = true;
			color = { one, one, add };
			alpha = { one, one, add };
		};
	};

	code
	{
		// Per-pass parameters. The descriptions below are derived from how each value is used in
		// vsmain/fsmain in this file; the code that fills the buffer is not visible here.
		cbuffer Params
		{
			// Only .x is read here: it is divided by (blocksPerTile * 2) to get the number of instances per row
			uint2 gTileCount;
			// Multiplied with pixel positions to produce UVs for sampling gInputTex
			float2 gInvInputSize;
			// Multiplied with the final sprite vertex position (in pixels) to produce output UVs
			float2 gInvOutputSize;
			// If the summed per-channel color range of a 2x2 block exceeds this, its quads are rendered separately
			float gAdaptiveThresholdColor;
			// If the circle of confusion at the block's mid-range depth is below this, its quads are rendered separately
			float gAdaptiveThresholdCOC;
			// Scales the circle of confusion into a sprite size in pixels (per axis)
			float2 gBokehSize;
			// Vertical offset, in pixels, added to sprites whose depth is in front of gFocalPlaneDistance
			uint gLayerPixelOffset;
			// Scales the sprite/scene depth difference before it is saturated into a fade factor (DEPTH_OCCLUSION only)
			float gInvDepthRange;
		};
		
		// Input image the sprites are generated from. As used below, .rgb holds color and .a holds linear depth.
		// Sampled in the vertex stage (2x2 block fetch) and, with DEPTH_OCCLUSION, again in the fragment stage.
		Texture2D gInputTex;
		// Sampler for gInputTex; all three address modes are set to clamp.
		SamplerState gInputSampler
		{
			AddressU = CLAMP;
			AddressV = CLAMP;
			AddressW = CLAMP;
		};
	
		// Data passed from vsmain to fsmain.
		struct VStoFS
		{
			// Sprite vertex position; vsmain writes it as float4(ndcPos, 0, 1)
			float4 position : SV_POSITION;
			// UV used to sample the bokeh shape texture; copied unchanged from the vertex input
			noperspective float2 uv0 : TEXCOORD0;
			// Sprite color and weight, already scaled by the layer contribution; not interpolated across the quad
			nointerpolation float4 color : TEXCOORD1;
			
			#if DEPTH_OCCLUSION
			// UV into gInputTex for the pixel being shaded, used to fetch the scene depth under the sprite
			float2 screenUV : TEXCOORD2;
			// Depth of the texel(s) the sprite was generated from; not interpolated across the quad
			nointerpolation float depth : TEXCOORD3;
			#endif
		};

		// Vertex stage input. Sprite placement is derived from the two system-generated indices;
		// the only per-vertex attribute read from the vertex buffer is the UV.
		struct VertexInput
		{
			// Index of the vertex within the instance; vsmain treats every 4 consecutive ids as one quad
			uint vertexId : SV_VertexID;
			// Index of the instance; vsmain uses it to locate the group of quads within the image
			uint instanceId : SV_InstanceID;
			// UV passed through unchanged to the fragment stage
			float2 uv0 : TEXCOORD0;
		};
		
		// Vertex stage. Builds one corner of a bokeh sprite (quad) from the vertex and instance indices:
		//  - every 4 consecutive vertex ids form one quad and every 4 consecutive quads form one 2x2 block,
		//    while the instance id selects which group of blocks (tile) is being processed
		//  - the four input texels around the block position are fetched and compared; if they are similar
		//    enough a single merged sprite is emitted for the block, otherwise one sprite per texel
		//  - the sprite is sized from the circle of confusion at its depth and positioned in the output
		//
		// QUADS_PER_TILE, gFocalPlaneDistance, gFocalLength, circleOfConfusionPhysical(),
		// computeLayerContributions() and UVToNDC() are not declared in this file; presumably they come from
		// the DepthOfFieldCommon / PerCameraData mixins or a build-time define -- confirm there.
		VStoFS vsmain(VertexInput input)
		{
			uint vid = input.vertexId;
			uint iid = input.instanceId;
		
			// We group quads in tiles for performance reasons (less instances)
			// Additionally, we group the quads within the tiles into 2x2 blocks for adaptive rendering
			// (Generally a tile is 8 quads, meaning 2 blocks per tile)
			uint quadIdxInTile = vid / 4;
			uint quadIdxInBlock = quadIdxInTile % 4;
			
			// Find the top-left position of the current block, in pixels
			uint blocksPerTile = QUADS_PER_TILE / 4;
			
			// TODO - Since the way we're sampling below, should this be the block center?
			// - Then again maybe not, because the offset we apply to blockPos below seems similar?
			uint blocksInRow = gTileCount.x / (blocksPerTile * 2);
			float2 blockPos = 
				float2(iid % blocksInRow, iid / blocksInRow)
				* uint2(blocksPerTile * 2, 2) // Each tile is 2 pixels (quads) high, with N blocks with 2 pixels (quads) wide
				+ uint2((quadIdxInTile/4) * 2, 0); // Each block has N quads laid out in a row, and each block is 2 quads wide
			
			// Color in .rgb, linear depth in .a
			// The four fetches are offset by half a pixel in each direction around blockPos. Sample order is
			// (-x,-y), (+x,-y), (-x,+y), (+x,+y), which matches the quadIdxInBlock -> offset mapping used below.
			float4 samples[4];
			samples[0] = gInputTex.SampleLevel(gInputSampler, (blockPos + float2(-0.5f, -0.5f)) * gInvInputSize, 0);
			samples[1] = gInputTex.SampleLevel(gInputSampler, (blockPos + float2( 0.5f, -0.5f)) * gInvInputSize, 0);
			samples[2] = gInputTex.SampleLevel(gInputSampler, (blockPos + float2(-0.5f,  0.5f)) * gInvInputSize, 0);
			samples[3] = gInputTex.SampleLevel(gInputSampler, (blockPos + float2( 0.5f,  0.5f)) * gInvInputSize, 0);

			// Per-component range of the block (color range in .rgb, depth range in .a)
			float4 minSamples = min(min(samples[0], samples[1]), min(samples[2], samples[3]));
			float4 maxSamples = max(max(samples[0], samples[1]), max(samples[2], samples[3]));
			
			// Any of the three checks below can force the block to be drawn as four individual sprites
			bool needSeparateQuads = false;
			
			// Are the colors too different?
			// (dot with 1 sums the per-channel differences)
			float3 colorDiff = maxSamples.rgb - minSamples.rgb;
			if(dot(colorDiff, 1) > gAdaptiveThresholdColor)
				needSeparateQuads = true;
			
			// Do the samples fall on different layers?
			// Layer 0: in front of the focal plane, layer 2: beyond focal plane + focal length, layer 1: in between
			int minLayer = minSamples.a < gFocalPlaneDistance ? 0 :
				(minSamples.a > (gFocalPlaneDistance + gFocalLength) ? 2 : 1);
				
			int maxLayer = maxSamples.a < gFocalPlaneDistance ? 0 :
				(maxSamples.a > (gFocalPlaneDistance + gFocalLength) ? 2 : 1);

			if(minLayer != maxLayer)
				needSeparateQuads = true;

			// Don't skip small quads
			// (blocks whose circle of confusion at the mid-range depth is below the threshold are never merged)
			float avgDepth = (minSamples.a + maxSamples.a) * 0.5f;
			float avgCOC = circleOfConfusionPhysical(avgDepth);
			if(avgCOC < gAdaptiveThresholdCOC)
				needSeparateQuads = true;
			
			float4 colorAndDepth;
			if(needSeparateQuads)
			{
				// Each quad represents its own texel: take that texel's sample and move the sprite center onto it
				colorAndDepth = samples[quadIdxInBlock];
				blockPos += float2(quadIdxInBlock % 2, quadIdxInBlock / 2) - 0.5f;
			}
			else
				// Merged: the sprite represents the average of all four texels and stays at the block position
				colorAndDepth = (samples[0] + samples[1] + samples[2] + samples[3]) * 0.25f;

			float sceneDepth = colorAndDepth.a;
			float coc = circleOfConfusionPhysical(sceneDepth);

			// 2 pixel minimum size
			float2 cocPixelSize = max(coc * gBokehSize.xy, 2.0f);

			// Alpha starts at 1 and is scaled together with the color below, so it carries the sprite's weight
			float4 color = float4(colorAndDepth.rgb, 1);
			float2 layer = computeLayerContributions(sceneDepth);

			// .r is applied to sprites in front of the focal plane, .g to all others
			color *= (sceneDepth < gFocalPlaneDistance) ? layer.r : layer.g;

			if(!needSeparateQuads)
			{
				// Make other three quads zero-sized
				// (all four vertices then collapse onto blockPos, so only quad 0 covers any pixels)
				if(quadIdxInBlock != 0)
					cocPixelSize = 0;
			}
			else
				// Four separate sprites each carry a quarter of the weight a single merged sprite carries
				color *= 0.25f;

			// Offset so we render both near and far fields in the same texture but with an offset
			float vertOffset = sceneDepth < gFocalPlaneDistance ? gLayerPixelOffset : 0;
			
			// Determine location of the vertex within the current quad
			// Vertex 0..3 maps to corners (0,0), (1,0), (0,1), (1,1)
			uint vertexIdxInQuad = vid % 4;				
			float2 localPos = float2(vertexIdxInQuad % 2, vertexIdxInQuad / 2);
			
			// Expand the corner around the sprite center. screenPos excludes the layer offset so that it can
			// still be used to address the input texture; the offset only affects the output position.
			float2 screenPos = blockPos + (localPos - 0.5f) * cocPixelSize;
			float2 uvPos = (screenPos + float2(0, vertOffset)) * gInvOutputSize;			
			float2 ndcPos = UVToNDC(uvPos);
			
			VStoFS output;			
			output.position = float4(ndcPos, 0, 1);
			output.uv0 = input.uv0;
			output.color = color;
			
			#if DEPTH_OCCLUSION
			// Passed along so the fragment stage can compare the sprite's depth with the scene depth under it
			output.screenUV = screenPos * gInvInputSize;
			output.depth = sceneDepth;
			#endif

			return output;
		}			

		// Texture holding the bokeh sprite shape; only its red channel is read by fsmain.
		Texture2D gBokehTex;
		// Sampler for gBokehTex; no states are overridden here.
		SamplerState gBokehSampler;
		
		// Fragment stage. Modulates the per-sprite color coming from the vertex stage by the red channel of
		// the bokeh shape texture. With DEPTH_OCCLUSION the result is additionally faded out as the sprite's
		// depth grows past the depth stored in the input texture at the shaded pixel.
		float4 fsmain(VStoFS input) : SV_Target0
		{
			// Shape mask of the bokeh sprite at this pixel
			float shapeMask = gBokehTex.Sample(gBokehSampler, input.uv0).r;
			float4 result = shapeMask * input.color;

			#if DEPTH_OCCLUSION
				// Depth stored in the input texture underneath the sprite (alpha channel)
				float depthUnderSprite = gInputTex.SampleLevel(gInputSampler, input.screenUV, 0).a;

				// Positive when the sprite lies further away than what is stored at this pixel
				float depthDelta = input.depth - depthUnderSprite;

				// Full contribution at or in front of the stored depth, fading to zero over the depth range
				float occlusionFade = 1.0f - saturate(depthDelta * gInvDepthRange);
				result *= occlusionFade;
			#endif

			return result;
		}	
	};
};