// BsSamplerOverrides.cpp
  1. //********************************** Banshee Engine (www.banshee3d.com) **************************************************//
  2. //**************** Copyright (c) 2016 Marko Pintera ([email protected]). All rights reserved. **********************//
  3. #include "BsSamplerOverrides.h"
  4. #include "BsRenderBeastOptions.h"
  5. #include "BsMaterial.h"
  6. #include "BsGpuParams.h"
  7. #include "BsGpuParamsSet.h"
  8. #include "BsGpuParamDesc.h"
  9. #include "BsMaterialParams.h"
  10. #include "BsSamplerState.h"
  11. #include "BsRenderStateManager.h"
  12. namespace bs
  13. {
  14. MaterialSamplerOverrides* SamplerOverrideUtility::generateSamplerOverrides(const SPtr<ShaderCore>& shader,
  15. const SPtr<MaterialParamsCore>& params, const SPtr<GpuParamsSetCore>& paramsSet,
  16. const SPtr<RenderBeastOptions>& options)
  17. {
  18. MaterialSamplerOverrides* output = nullptr;
  19. if (shader == nullptr)
  20. return nullptr;
  21. bs_frame_mark();
  22. {
  23. // Generate a list of all sampler state overrides
  24. FrameUnorderedMap<String, UINT32> overrideLookup;
  25. Vector<SamplerOverride> overrides;
  26. auto& samplerParams = shader->getSamplerParams();
  27. for(auto& samplerParam : samplerParams)
  28. {
  29. UINT32 paramIdx;
  30. auto result = params->getParamIndex(samplerParam.first, MaterialParams::ParamType::Sampler, GPDT_UNKNOWN,
  31. 0, paramIdx);
  32. // Parameter shouldn't be in the valid parameter list if it cannot be found
  33. assert(result == MaterialParams::GetParamResult::Success);
  34. const MaterialParamsBase::ParamData* materialParamData = params->getParamData(paramIdx);
  35. UINT32 overrideIdx = (UINT32)overrides.size();
  36. overrides.push_back(SamplerOverride());
  37. SamplerOverride& override = overrides.back();
  38. SPtr<SamplerStateCore> samplerState;
  39. params->getSamplerState(materialParamData->index, samplerState);
  40. if (samplerState == nullptr)
  41. samplerState = SamplerStateCore::getDefault();
  42. override.paramIdx = paramIdx;
  43. if (checkNeedsOverride(samplerState, options))
  44. override.state = generateSamplerOverride(samplerState, options);
  45. else
  46. override.state = samplerState;
  47. override.originalStateHash = override.state->getProperties().getHash();
  48. overrideLookup[samplerParam.first] = overrideIdx;
  49. }
  50. UINT32 numPasses = paramsSet->getNumPasses();
  51. // First pass just determine if we even need to override and count the number of sampler states
  52. UINT32* numSetsPerPass = (UINT32*)bs_stack_alloc<UINT32>(numPasses);
  53. memset(numSetsPerPass, 0, sizeof(UINT32) * numPasses);
  54. UINT32 totalNumSets = 0;
  55. for (UINT32 i = 0; i < numPasses; i++)
  56. {
  57. UINT32 maxSamplerSet = 0;
  58. SPtr<GpuParamsCore> paramsPtr = paramsSet->getGpuParams(i);
  59. for (UINT32 j = 0; j < GpuParamsSetCore::NUM_STAGES; j++)
  60. {
  61. GpuProgramType progType = (GpuProgramType)j;
  62. SPtr<GpuParamDesc> paramDesc = paramsPtr->getParamDesc(progType);
  63. if (paramDesc == nullptr)
  64. continue;
  65. for (auto iter = paramDesc->samplers.begin(); iter != paramDesc->samplers.end(); ++iter)
  66. {
  67. UINT32 set = iter->second.set;
  68. maxSamplerSet = std::max(maxSamplerSet, set + 1);
  69. }
  70. }
  71. numSetsPerPass[i] = maxSamplerSet;
  72. totalNumSets += maxSamplerSet;
  73. }
  74. UINT32 totalNumSamplerStates = 0;
  75. UINT32* slotsPerSet = (UINT32*)bs_stack_alloc<UINT32>(totalNumSets);
  76. memset(slotsPerSet, 0, sizeof(UINT32) * totalNumSets);
  77. UINT32* slotsPerSetIter = slotsPerSet;
  78. for (UINT32 i = 0; i < numPasses; i++)
  79. {
  80. SPtr<GpuParamsCore> paramsPtr = paramsSet->getGpuParams(i);
  81. for (UINT32 j = 0; j < GpuParamsSetCore::NUM_STAGES; j++)
  82. {
  83. GpuProgramType progType = (GpuProgramType)j;
  84. SPtr<GpuParamDesc> paramDesc = paramsPtr->getParamDesc(progType);
  85. if (paramDesc == nullptr)
  86. continue;
  87. for (auto iter = paramDesc->samplers.begin(); iter != paramDesc->samplers.end(); ++iter)
  88. {
  89. UINT32 set = iter->second.set;
  90. UINT32 slot = iter->second.slot;
  91. slotsPerSetIter[set] = std::max(slotsPerSetIter[set], slot + 1);
  92. }
  93. }
  94. for(UINT32 j = 0; j < numSetsPerPass[i]; j++)
  95. totalNumSamplerStates += slotsPerSetIter[j];
  96. slotsPerSetIter += numSetsPerPass[i];
  97. }
  98. UINT32 outputSize = sizeof(MaterialSamplerOverrides) +
  99. numPasses * sizeof(PassSamplerOverrides) +
  100. totalNumSets * sizeof(UINT32*) +
  101. totalNumSamplerStates * sizeof(UINT32) +
  102. (UINT32)overrides.size() * sizeof(SamplerOverride);
  103. UINT8* outputData = (UINT8*)bs_alloc(outputSize);
  104. output = (MaterialSamplerOverrides*)outputData;
  105. outputData += sizeof(MaterialSamplerOverrides);
  106. output->refCount = 0;
  107. output->numPasses = numPasses;
  108. output->passes = (PassSamplerOverrides*)outputData;
  109. output->isDirty = true;
  110. outputData += sizeof(PassSamplerOverrides) * numPasses;
  111. slotsPerSetIter = slotsPerSet;
  112. for (UINT32 i = 0; i < numPasses; i++)
  113. {
  114. SPtr<GpuParamsCore> paramsPtr = paramsSet->getGpuParams(i);
  115. PassSamplerOverrides& passOverrides = output->passes[i];
  116. passOverrides.numSets = numSetsPerPass[i];
  117. passOverrides.stateOverrides = (UINT32**)outputData;
  118. outputData += sizeof(UINT32*) * passOverrides.numSets;
  119. for (UINT32 j = 0; j < passOverrides.numSets; j++)
  120. {
  121. GpuProgramType progType = (GpuProgramType)j;
  122. SPtr<GpuParamDesc> paramDesc = paramsPtr->getParamDesc(progType);
  123. if (paramDesc == nullptr)
  124. continue;
  125. passOverrides.stateOverrides[j] = (UINT32*)outputData;
  126. UINT32 numStates = 0;
  127. for (auto iter = paramDesc->samplers.begin(); iter != paramDesc->samplers.end(); ++iter)
  128. {
  129. UINT32 slot = iter->second.slot;
  130. while (slot > numStates)
  131. {
  132. passOverrides.stateOverrides[j][numStates] = (UINT32)-1;
  133. numStates++;
  134. }
  135. numStates = std::max(numStates, slot + 1);
  136. auto iterFind = overrideLookup.find(iter->first);
  137. if (iterFind != overrideLookup.end())
  138. passOverrides.stateOverrides[j][slot] = iterFind->second;
  139. else
  140. passOverrides.stateOverrides[j][slot] = (UINT32)-1;
  141. }
  142. outputData += sizeof(UINT32) * slotsPerSetIter[j];
  143. }
  144. slotsPerSetIter += passOverrides.numSets;
  145. }
  146. output->numOverrides = (UINT32)overrides.size();
  147. output->overrides = (SamplerOverride*)outputData;
  148. for(UINT32 i = 0; i < output->numOverrides; i++)
  149. {
  150. new (&output->overrides[i].state) SPtr<SamplerStateCore>();
  151. output->overrides[i] = overrides[i];
  152. }
  153. bs_stack_free(slotsPerSet);
  154. bs_stack_free(numSetsPerPass);
  155. }
  156. bs_frame_clear();
  157. return output;
  158. }
  159. void SamplerOverrideUtility::destroySamplerOverrides(MaterialSamplerOverrides* overrides)
  160. {
  161. if (overrides != nullptr)
  162. {
  163. for (UINT32 i = 0; i < overrides->numOverrides; i++)
  164. overrides->overrides[i].state.~SPtr<SamplerStateCore>();
  165. bs_free(overrides);
  166. overrides = nullptr;
  167. }
  168. }
  169. bool SamplerOverrideUtility::checkNeedsOverride(const SPtr<SamplerStateCore>& samplerState, const SPtr<RenderBeastOptions>& options)
  170. {
  171. const SamplerProperties& props = samplerState->getProperties();
  172. switch (options->filtering)
  173. {
  174. case RenderBeastFiltering::Bilinear:
  175. {
  176. if (props.getTextureFiltering(FT_MIN) != FO_LINEAR)
  177. return true;
  178. if (props.getTextureFiltering(FT_MAG) != FO_LINEAR)
  179. return true;
  180. if (props.getTextureFiltering(FT_MIP) != FO_POINT)
  181. return true;
  182. }
  183. break;
  184. case RenderBeastFiltering::Trilinear:
  185. {
  186. if (props.getTextureFiltering(FT_MIN) != FO_LINEAR)
  187. return true;
  188. if (props.getTextureFiltering(FT_MAG) != FO_LINEAR)
  189. return true;
  190. if (props.getTextureFiltering(FT_MIP) != FO_LINEAR)
  191. return true;
  192. }
  193. break;
  194. case RenderBeastFiltering::Anisotropic:
  195. {
  196. if (props.getTextureFiltering(FT_MIN) != FO_ANISOTROPIC)
  197. return true;
  198. if (props.getTextureFiltering(FT_MAG) != FO_ANISOTROPIC)
  199. return true;
  200. if (props.getTextureFiltering(FT_MIP) != FO_ANISOTROPIC)
  201. return true;
  202. if (props.getTextureAnisotropy() != options->anisotropyMax)
  203. return true;
  204. }
  205. break;
  206. }
  207. return false;
  208. }
  209. SPtr<SamplerStateCore> SamplerOverrideUtility::generateSamplerOverride(const SPtr<SamplerStateCore>& samplerState, const SPtr<RenderBeastOptions>& options)
  210. {
  211. const SamplerProperties& props = samplerState->getProperties();
  212. SAMPLER_STATE_DESC desc = props.getDesc();
  213. switch (options->filtering)
  214. {
  215. case RenderBeastFiltering::Bilinear:
  216. desc.minFilter = FO_LINEAR;
  217. desc.magFilter = FO_LINEAR;
  218. desc.mipFilter = FO_POINT;
  219. break;
  220. case RenderBeastFiltering::Trilinear:
  221. desc.minFilter = FO_LINEAR;
  222. desc.magFilter = FO_LINEAR;
  223. desc.mipFilter = FO_LINEAR;
  224. break;
  225. case RenderBeastFiltering::Anisotropic:
  226. desc.minFilter = FO_ANISOTROPIC;
  227. desc.magFilter = FO_ANISOTROPIC;
  228. desc.mipFilter = FO_ANISOTROPIC;
  229. break;
  230. }
  231. desc.maxAniso = options->anisotropyMax;
  232. return RenderStateCoreManager::instance().createSamplerState(desc);
  233. }
  234. }