BsD3D11RenderAPI.cpp 36 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149
  1. #include "BsD3D11RenderAPI.h"
  2. #include "BsD3D11DriverList.h"
  3. #include "BsD3D11Driver.h"
  4. #include "BsD3D11Device.h"
  5. #include "BsD3D11TextureManager.h"
  6. #include "BsD3D11Texture.h"
  7. #include "BsD3D11HardwareBufferManager.h"
  8. #include "BsD3D11RenderWindowManager.h"
  9. #include "BsD3D11HLSLProgramFactory.h"
  10. #include "BsD3D11BlendState.h"
  11. #include "BsD3D11RasterizerState.h"
  12. #include "BsD3D11DepthStencilState.h"
  13. #include "BsD3D11SamplerState.h"
  14. #include "BsD3D11GpuProgram.h"
  15. #include "BsD3D11Mappings.h"
  16. #include "BsD3D11VertexBuffer.h"
  17. #include "BsD3D11IndexBuffer.h"
  18. #include "BsD3D11RenderStateManager.h"
  19. #include "BsD3D11GpuParamBlockBuffer.h"
  20. #include "BsD3D11InputLayoutManager.h"
  21. #include "BsD3D11TextureView.h"
  22. #include "BsD3D11RenderUtility.h"
  23. #include "BsGpuParams.h"
  24. #include "BsCoreThread.h"
  25. #include "BsD3D11QueryManager.h"
  26. #include "BsDebug.h"
  27. #include "BsException.h"
  28. #include "BsRenderStats.h"
  29. #include "BsGpuParamDesc.h"
  30. namespace BansheeEngine
  31. {
  32. D3D11RenderAPI::D3D11RenderAPI()
  33. : mDXGIFactory(nullptr), mDevice(nullptr), mDriverList(nullptr)
  34. , mActiveD3DDriver(nullptr), mFeatureLevel(D3D_FEATURE_LEVEL_11_0)
  35. , mHLSLFactory(nullptr), mIAManager(nullptr)
  36. , mStencilRef(0), mActiveDrawOp(DOT_TRIANGLE_LIST)
  37. , mViewportNorm(0.0f, 0.0f, 1.0f, 1.0f)
  38. {
  39. mClipPlanesDirty = false; // DX11 handles clip planes through shaders
  40. }
  41. D3D11RenderAPI::~D3D11RenderAPI()
  42. {
  43. }
  44. const StringID& D3D11RenderAPI::getName() const
  45. {
  46. static StringID strName("D3D11RenderAPI");
  47. return strName;
  48. }
  49. const String& D3D11RenderAPI::getShadingLanguageName() const
  50. {
  51. static String strName("hlsl");
  52. return strName;
  53. }
  54. void D3D11RenderAPI::initializePrepare()
  55. {
  56. THROW_IF_NOT_CORE_THREAD;
  57. HRESULT hr = CreateDXGIFactory(__uuidof(IDXGIFactory), (void**)&mDXGIFactory);
  58. if(FAILED(hr))
  59. BS_EXCEPT(RenderingAPIException, "Failed to create Direct3D11 DXGIFactory");
  60. mDriverList = bs_new<D3D11DriverList>(mDXGIFactory);
  61. mActiveD3DDriver = mDriverList->item(0); // TODO: Always get first driver, for now
  62. mVideoModeInfo = mActiveD3DDriver->getVideoModeInfo();
  63. IDXGIAdapter* selectedAdapter = mActiveD3DDriver->getDeviceAdapter();
  64. D3D_FEATURE_LEVEL requestedLevels[] = {
  65. D3D_FEATURE_LEVEL_11_0,
  66. D3D_FEATURE_LEVEL_10_1,
  67. D3D_FEATURE_LEVEL_10_0,
  68. D3D_FEATURE_LEVEL_9_3,
  69. D3D_FEATURE_LEVEL_9_2,
  70. D3D_FEATURE_LEVEL_9_1
  71. };
  72. UINT32 numRequestedLevel = sizeof(requestedLevels) / sizeof(requestedLevels[0]);
  73. UINT32 deviceFlags = 0;
  74. #if BS_DEBUG_MODE
  75. deviceFlags |= D3D11_CREATE_DEVICE_DEBUG;
  76. #endif
  77. ID3D11Device* device;
  78. hr = D3D11CreateDevice(selectedAdapter, D3D_DRIVER_TYPE_UNKNOWN, nullptr, deviceFlags,
  79. requestedLevels, numRequestedLevel, D3D11_SDK_VERSION, &device, &mFeatureLevel, nullptr);
  80. if(FAILED(hr))
  81. BS_EXCEPT(RenderingAPIException, "Failed to create Direct3D11 object. D3D11CreateDeviceN returned this error code: " + toString(hr));
  82. mDevice = bs_new<D3D11Device>(device);
  83. // This must query for DirectX 10 interface as this is unsupported for DX11
  84. LARGE_INTEGER driverVersion;
  85. if(SUCCEEDED(selectedAdapter->CheckInterfaceSupport(IID_ID3D10Device, &driverVersion)))
  86. {
  87. mDriverVersion.major = HIWORD(driverVersion.HighPart);
  88. mDriverVersion.minor = LOWORD(driverVersion.HighPart);
  89. mDriverVersion.release = HIWORD(driverVersion.LowPart);
  90. mDriverVersion.build = LOWORD(driverVersion.LowPart);
  91. }
  92. // Create the texture manager for use by others
  93. TextureManager::startUp<D3D11TextureManager>();
  94. TextureCoreManager::startUp<D3D11TextureCoreManager>();
  95. // Create hardware buffer manager
  96. HardwareBufferManager::startUp();
  97. HardwareBufferCoreManager::startUp<D3D11HardwareBufferCoreManager>(std::ref(*mDevice));
  98. // Create render window manager
  99. RenderWindowManager::startUp<D3D11RenderWindowManager>(this);
  100. RenderWindowCoreManager::startUp<D3D11RenderWindowCoreManager>(this);
  101. // Create & register HLSL factory
  102. mHLSLFactory = bs_new<D3D11HLSLProgramFactory>();
  103. // Create render state manager
  104. RenderStateCoreManager::startUp<D3D11RenderStateCoreManager>();
  105. mCurrentCapabilities = createRenderSystemCapabilities();
  106. mCurrentCapabilities->addShaderProfile("hlsl");
  107. GpuProgramCoreManager::instance().addFactory(mHLSLFactory);
  108. mIAManager = bs_new<D3D11InputLayoutManager>();
  109. RenderAPICore::initializePrepare();
  110. }
  111. void D3D11RenderAPI::initializeFinalize(const SPtr<RenderWindowCore>& primaryWindow)
  112. {
  113. D3D11RenderUtility::startUp(mDevice);
  114. QueryManager::startUp<D3D11QueryManager>();
  115. RenderAPICore::initializeFinalize(primaryWindow);
  116. }
  117. void D3D11RenderAPI::destroyCore()
  118. {
  119. THROW_IF_NOT_CORE_THREAD;
  120. for (auto& boundUAV : mBoundUAVs)
  121. {
  122. if (boundUAV.second != nullptr)
  123. boundUAV.first->releaseView(boundUAV.second);
  124. }
  125. QueryManager::shutDown();
  126. D3D11RenderUtility::shutDown();
  127. if(mIAManager != nullptr)
  128. {
  129. bs_delete(mIAManager);
  130. mIAManager = nullptr;
  131. }
  132. if(mHLSLFactory != nullptr)
  133. {
  134. bs_delete(mHLSLFactory);
  135. mHLSLFactory = nullptr;
  136. }
  137. mActiveVertexDeclaration = nullptr;
  138. mActiveVertexShader = nullptr;
  139. mActiveRenderTarget = nullptr;
  140. RenderStateCoreManager::shutDown();
  141. RenderWindowCoreManager::shutDown();
  142. RenderWindowManager::shutDown();
  143. HardwareBufferCoreManager::shutDown();
  144. HardwareBufferManager::shutDown();
  145. TextureCoreManager::shutDown();
  146. TextureManager::shutDown();
  147. SAFE_RELEASE(mDXGIFactory);
  148. if(mDevice != nullptr)
  149. {
  150. bs_delete(mDevice);
  151. mDevice = nullptr;
  152. }
  153. if(mDriverList != nullptr)
  154. {
  155. bs_delete(mDriverList);
  156. mDriverList = nullptr;
  157. }
  158. mActiveD3DDriver = nullptr;
  159. RenderAPICore::destroyCore();
  160. }
  161. void D3D11RenderAPI::setSamplerState(GpuProgramType gptype, UINT16 texUnit, const SPtr<SamplerStateCore>& samplerState)
  162. {
  163. THROW_IF_NOT_CORE_THREAD;
  164. // TODO - I'm setting up views one by one, it might be more efficient to hold them in an array
  165. // and then set them all up at once before rendering? Needs testing
  166. ID3D11SamplerState* samplerArray[1];
  167. D3D11SamplerStateCore* d3d11SamplerState = static_cast<D3D11SamplerStateCore*>(const_cast<SamplerStateCore*>(samplerState.get()));
  168. samplerArray[0] = d3d11SamplerState->getInternal();
  169. switch(gptype)
  170. {
  171. case GPT_VERTEX_PROGRAM:
  172. mDevice->getImmediateContext()->VSSetSamplers(texUnit, 1, samplerArray);
  173. break;
  174. case GPT_FRAGMENT_PROGRAM:
  175. mDevice->getImmediateContext()->PSSetSamplers(texUnit, 1, samplerArray);
  176. break;
  177. case GPT_GEOMETRY_PROGRAM:
  178. mDevice->getImmediateContext()->GSSetSamplers(texUnit, 1, samplerArray);
  179. break;
  180. case GPT_DOMAIN_PROGRAM:
  181. mDevice->getImmediateContext()->DSSetSamplers(texUnit, 1, samplerArray);
  182. break;
  183. case GPT_HULL_PROGRAM:
  184. mDevice->getImmediateContext()->HSSetSamplers(texUnit, 1, samplerArray);
  185. break;
  186. case GPT_COMPUTE_PROGRAM:
  187. mDevice->getImmediateContext()->CSSetSamplers(texUnit, 1, samplerArray);
  188. break;
  189. default:
  190. BS_EXCEPT(InvalidParametersException, "Unsupported gpu program type: " + toString(gptype));
  191. }
  192. BS_INC_RENDER_STAT(NumSamplerBinds);
  193. }
  194. void D3D11RenderAPI::setBlendState(const SPtr<BlendStateCore>& blendState)
  195. {
  196. THROW_IF_NOT_CORE_THREAD;
  197. D3D11BlendStateCore* d3d11BlendState = static_cast<D3D11BlendStateCore*>(const_cast<BlendStateCore*>(blendState.get()));
  198. mDevice->getImmediateContext()->OMSetBlendState(d3d11BlendState->getInternal(), nullptr, 0xFFFFFFFF);
  199. BS_INC_RENDER_STAT(NumBlendStateChanges);
  200. }
  201. void D3D11RenderAPI::setRasterizerState(const SPtr<RasterizerStateCore>& rasterizerState)
  202. {
  203. THROW_IF_NOT_CORE_THREAD;
  204. D3D11RasterizerStateCore* d3d11RasterizerState = static_cast<D3D11RasterizerStateCore*>(const_cast<RasterizerStateCore*>(rasterizerState.get()));
  205. mDevice->getImmediateContext()->RSSetState(d3d11RasterizerState->getInternal());
  206. BS_INC_RENDER_STAT(NumRasterizerStateChanges);
  207. }
  208. void D3D11RenderAPI::setDepthStencilState(const SPtr<DepthStencilStateCore>& depthStencilState, UINT32 stencilRefValue)
  209. {
  210. THROW_IF_NOT_CORE_THREAD;
  211. D3D11DepthStencilStateCore* d3d11RasterizerState = static_cast<D3D11DepthStencilStateCore*>(const_cast<DepthStencilStateCore*>(depthStencilState.get()));
  212. mDevice->getImmediateContext()->OMSetDepthStencilState(d3d11RasterizerState->getInternal(), stencilRefValue);
  213. BS_INC_RENDER_STAT(NumDepthStencilStateChanges);
  214. }
  215. void D3D11RenderAPI::setTexture(GpuProgramType gptype, UINT16 unit, bool enabled, const SPtr<TextureCore>& texPtr)
  216. {
  217. THROW_IF_NOT_CORE_THREAD;
  218. // TODO - I'm setting up views one by one, it might be more efficient to hold them in an array
  219. // and then set them all up at once before rendering? Needs testing
  220. ID3D11ShaderResourceView* viewArray[1];
  221. if(texPtr != nullptr && enabled)
  222. {
  223. D3D11TextureCore* d3d11Texture = static_cast<D3D11TextureCore*>(texPtr.get());
  224. viewArray[0] = d3d11Texture->getSRV();
  225. }
  226. else
  227. viewArray[0] = nullptr;
  228. switch(gptype)
  229. {
  230. case GPT_VERTEX_PROGRAM:
  231. mDevice->getImmediateContext()->VSSetShaderResources(unit, 1, viewArray);
  232. break;
  233. case GPT_FRAGMENT_PROGRAM:
  234. mDevice->getImmediateContext()->PSSetShaderResources(unit, 1, viewArray);
  235. break;
  236. case GPT_GEOMETRY_PROGRAM:
  237. mDevice->getImmediateContext()->GSSetShaderResources(unit, 1, viewArray);
  238. break;
  239. case GPT_DOMAIN_PROGRAM:
  240. mDevice->getImmediateContext()->DSSetShaderResources(unit, 1, viewArray);
  241. break;
  242. case GPT_HULL_PROGRAM:
  243. mDevice->getImmediateContext()->HSSetShaderResources(unit, 1, viewArray);
  244. break;
  245. case GPT_COMPUTE_PROGRAM:
  246. mDevice->getImmediateContext()->CSSetShaderResources(unit, 1, viewArray);
  247. break;
  248. default:
  249. BS_EXCEPT(InvalidParametersException, "Unsupported gpu program type: " + toString(gptype));
  250. }
  251. BS_INC_RENDER_STAT(NumTextureBinds);
  252. }
  253. void D3D11RenderAPI::setLoadStoreTexture(GpuProgramType gptype, UINT16 unit, bool enabled, const SPtr<TextureCore>& texPtr,
  254. const TextureSurface& surface)
  255. {
  256. THROW_IF_NOT_CORE_THREAD;
  257. // TODO - This hasn't bee tested and might be incorrect. I might need to set UAVs together with render targets,
  258. // especially considering DX11 expects number of UAVs to match number of render targets.
  259. ID3D11UnorderedAccessView* viewArray[1];
  260. if (texPtr != nullptr && enabled)
  261. {
  262. D3D11TextureCore* d3d11Texture = static_cast<D3D11TextureCore*>(texPtr.get());
  263. TextureViewPtr texView = TextureCore::requestView(texPtr, surface.mipLevel, 1,
  264. surface.arraySlice, surface.numArraySlices, GVU_RANDOMWRITE);
  265. D3D11TextureView* d3d11texView = static_cast<D3D11TextureView*>(texView.get());
  266. viewArray[0] = d3d11texView->getUAV();
  267. if (mBoundUAVs[unit].second != nullptr)
  268. mBoundUAVs[unit].first->releaseView(mBoundUAVs[unit].second);
  269. mBoundUAVs[unit] = std::make_pair(texPtr, texView);
  270. }
  271. else
  272. {
  273. viewArray[0] = nullptr;
  274. if (mBoundUAVs[unit].second != nullptr)
  275. mBoundUAVs[unit].first->releaseView(mBoundUAVs[unit].second);
  276. mBoundUAVs[unit] = std::pair<SPtr<TextureCore>, TextureViewPtr>();
  277. }
  278. if (gptype == GPT_FRAGMENT_PROGRAM)
  279. {
  280. mDevice->getImmediateContext()->OMSetRenderTargetsAndUnorderedAccessViews(
  281. D3D11_KEEP_RENDER_TARGETS_AND_DEPTH_STENCIL, nullptr, nullptr, unit, 1, viewArray, nullptr);
  282. }
  283. else if (gptype == GPT_COMPUTE_PROGRAM)
  284. {
  285. mDevice->getImmediateContext()->CSSetUnorderedAccessViews(unit, 1, viewArray, nullptr);
  286. }
  287. else
  288. BS_EXCEPT(InvalidParametersException, "Unsupported gpu program type: " + toString(gptype));
  289. BS_INC_RENDER_STAT(NumTextureBinds);
  290. }
  291. void D3D11RenderAPI::disableTextureUnit(GpuProgramType gptype, UINT16 texUnit)
  292. {
  293. THROW_IF_NOT_CORE_THREAD;
  294. setTexture(gptype, texUnit, false, nullptr);
  295. }
  296. void D3D11RenderAPI::beginFrame()
  297. {
  298. // Not used
  299. }
  300. void D3D11RenderAPI::endFrame()
  301. {
  302. // Not used
  303. }
  304. void D3D11RenderAPI::setViewport(const Rect2& vp)
  305. {
  306. THROW_IF_NOT_CORE_THREAD;
  307. mViewportNorm = vp;
  308. applyViewport();
  309. }
  310. void D3D11RenderAPI::applyViewport()
  311. {
  312. if (mActiveRenderTarget == nullptr)
  313. return;
  314. const RenderTargetProperties& rtProps = mActiveRenderTarget->getProperties();
  315. // Set viewport dimensions
  316. mViewport.TopLeftX = (FLOAT)(rtProps.getWidth() * mViewportNorm.x);
  317. mViewport.TopLeftY = (FLOAT)(rtProps.getHeight() * mViewportNorm.y);
  318. mViewport.Width = (FLOAT)(rtProps.getWidth() * mViewportNorm.width);
  319. mViewport.Height = (FLOAT)(rtProps.getHeight() * mViewportNorm.height);
  320. if (rtProps.requiresTextureFlipping())
  321. {
  322. // Convert "top-left" to "bottom-left"
  323. mViewport.TopLeftY = rtProps.getHeight() - mViewport.Height - mViewport.TopLeftY;
  324. }
  325. mViewport.MinDepth = 0.0f;
  326. mViewport.MaxDepth = 1.0f;
  327. mDevice->getImmediateContext()->RSSetViewports(1, &mViewport);
  328. }
  329. void D3D11RenderAPI::setVertexBuffers(UINT32 index, SPtr<VertexBufferCore>* buffers, UINT32 numBuffers)
  330. {
  331. THROW_IF_NOT_CORE_THREAD;
  332. UINT32 maxBoundVertexBuffers = mCurrentCapabilities->getMaxBoundVertexBuffers();
  333. if(index < 0 || (index + numBuffers) >= maxBoundVertexBuffers)
  334. BS_EXCEPT(InvalidParametersException, "Invalid vertex index: " + toString(index) + ". Valid range is 0 .. " + toString(maxBoundVertexBuffers - 1));
  335. ID3D11Buffer* dx11buffers[MAX_BOUND_VERTEX_BUFFERS];
  336. UINT32 strides[MAX_BOUND_VERTEX_BUFFERS];
  337. UINT32 offsets[MAX_BOUND_VERTEX_BUFFERS];
  338. for(UINT32 i = 0; i < numBuffers; i++)
  339. {
  340. SPtr<D3D11VertexBufferCore> vertexBuffer = std::static_pointer_cast<D3D11VertexBufferCore>(buffers[i]);
  341. const VertexBufferProperties& vbProps = vertexBuffer->getProperties();
  342. dx11buffers[i] = vertexBuffer->getD3DVertexBuffer();
  343. strides[i] = vbProps.getVertexSize();
  344. offsets[i] = 0;
  345. }
  346. mDevice->getImmediateContext()->IASetVertexBuffers(index, numBuffers, dx11buffers, strides, offsets);
  347. BS_INC_RENDER_STAT(NumVertexBufferBinds);
  348. }
  349. void D3D11RenderAPI::setIndexBuffer(const SPtr<IndexBufferCore>& buffer)
  350. {
  351. THROW_IF_NOT_CORE_THREAD;
  352. SPtr<D3D11IndexBufferCore> indexBuffer = std::static_pointer_cast<D3D11IndexBufferCore>(buffer);
  353. DXGI_FORMAT indexFormat = DXGI_FORMAT_R16_UINT;
  354. if(indexBuffer->getProperties().getType() == IT_16BIT)
  355. indexFormat = DXGI_FORMAT_R16_UINT;
  356. else if (indexBuffer->getProperties().getType() == IT_32BIT)
  357. indexFormat = DXGI_FORMAT_R32_UINT;
  358. else
  359. BS_EXCEPT(InternalErrorException, "Unsupported index format: " + toString(indexBuffer->getProperties().getType()));
  360. mDevice->getImmediateContext()->IASetIndexBuffer(indexBuffer->getD3DIndexBuffer(), indexFormat, 0);
  361. BS_INC_RENDER_STAT(NumIndexBufferBinds);
  362. }
  363. void D3D11RenderAPI::setVertexDeclaration(const SPtr<VertexDeclarationCore>& vertexDeclaration)
  364. {
  365. THROW_IF_NOT_CORE_THREAD;
  366. mActiveVertexDeclaration = vertexDeclaration;
  367. }
  368. void D3D11RenderAPI::setDrawOperation(DrawOperationType op)
  369. {
  370. THROW_IF_NOT_CORE_THREAD;
  371. mDevice->getImmediateContext()->IASetPrimitiveTopology(D3D11Mappings::getPrimitiveType(op));
  372. }
  373. void D3D11RenderAPI::bindGpuProgram(const SPtr<GpuProgramCore>& prg)
  374. {
  375. THROW_IF_NOT_CORE_THREAD;
  376. switch(prg->getProperties().getType())
  377. {
  378. case GPT_VERTEX_PROGRAM:
  379. {
  380. D3D11GpuVertexProgramCore* d3d11GpuProgram = static_cast<D3D11GpuVertexProgramCore*>(prg.get());
  381. mDevice->getImmediateContext()->VSSetShader(d3d11GpuProgram->getVertexShader(), nullptr, 0);
  382. mActiveVertexShader = std::static_pointer_cast<D3D11GpuProgramCore>(prg);
  383. break;
  384. }
  385. case GPT_FRAGMENT_PROGRAM:
  386. {
  387. D3D11GpuFragmentProgramCore* d3d11GpuProgram = static_cast<D3D11GpuFragmentProgramCore*>(prg.get());
  388. mDevice->getImmediateContext()->PSSetShader(d3d11GpuProgram->getPixelShader(), nullptr, 0);
  389. break;
  390. }
  391. case GPT_GEOMETRY_PROGRAM:
  392. {
  393. D3D11GpuGeometryProgramCore* d3d11GpuProgram = static_cast<D3D11GpuGeometryProgramCore*>(prg.get());
  394. mDevice->getImmediateContext()->GSSetShader(d3d11GpuProgram->getGeometryShader(), nullptr, 0);
  395. break;
  396. }
  397. case GPT_DOMAIN_PROGRAM:
  398. {
  399. D3D11GpuDomainProgramCore* d3d11GpuProgram = static_cast<D3D11GpuDomainProgramCore*>(prg.get());
  400. mDevice->getImmediateContext()->DSSetShader(d3d11GpuProgram->getDomainShader(), nullptr, 0);
  401. break;
  402. }
  403. case GPT_HULL_PROGRAM:
  404. {
  405. D3D11GpuHullProgramCore* d3d11GpuProgram = static_cast<D3D11GpuHullProgramCore*>(prg.get());
  406. mDevice->getImmediateContext()->HSSetShader(d3d11GpuProgram->getHullShader(), nullptr, 0);
  407. break;
  408. }
  409. case GPT_COMPUTE_PROGRAM:
  410. {
  411. D3D11GpuComputeProgramCore* d3d11GpuProgram = static_cast<D3D11GpuComputeProgramCore*>(prg.get());
  412. mDevice->getImmediateContext()->CSSetShader(d3d11GpuProgram->getComputeShader(), nullptr, 0);
  413. break;
  414. }
  415. default:
  416. BS_EXCEPT(InvalidParametersException, "Unsupported gpu program type: " + toString(prg->getProperties().getType()));
  417. }
  418. if (mDevice->hasError())
  419. BS_EXCEPT(RenderingAPIException, "Failed to bindGpuProgram : " + mDevice->getErrorDescription());
  420. BS_INC_RENDER_STAT(NumGpuProgramBinds);
  421. }
  422. void D3D11RenderAPI::unbindGpuProgram(GpuProgramType gptype)
  423. {
  424. THROW_IF_NOT_CORE_THREAD;
  425. switch(gptype)
  426. {
  427. case GPT_VERTEX_PROGRAM:
  428. mDevice->getImmediateContext()->VSSetShader(nullptr, nullptr, 0);
  429. mActiveVertexShader = nullptr;
  430. break;
  431. case GPT_FRAGMENT_PROGRAM:
  432. mDevice->getImmediateContext()->PSSetShader(nullptr, nullptr, 0);
  433. break;
  434. case GPT_GEOMETRY_PROGRAM:
  435. mDevice->getImmediateContext()->GSSetShader(nullptr, nullptr, 0);
  436. break;
  437. case GPT_DOMAIN_PROGRAM:
  438. mDevice->getImmediateContext()->DSSetShader(nullptr, nullptr, 0);
  439. break;
  440. case GPT_HULL_PROGRAM:
  441. mDevice->getImmediateContext()->HSSetShader(nullptr, nullptr, 0);
  442. break;
  443. case GPT_COMPUTE_PROGRAM:
  444. mDevice->getImmediateContext()->CSSetShader(nullptr, nullptr, 0);
  445. break;
  446. default:
  447. BS_EXCEPT(InvalidParametersException, "Unsupported gpu program type: " + toString(gptype));
  448. }
  449. BS_INC_RENDER_STAT(NumGpuProgramBinds);
  450. }
  451. void D3D11RenderAPI::setConstantBuffers(GpuProgramType gptype, const SPtr<GpuParamsCore>& bindableParams)
  452. {
  453. THROW_IF_NOT_CORE_THREAD;
  454. bindableParams->updateHardwareBuffers();
  455. const GpuParamDesc& paramDesc = bindableParams->getParamDesc();
  456. // TODO - I assign constant buffers one by one but it might be more efficient to do them all at once?
  457. ID3D11Buffer* bufferArray[1];
  458. for(auto iter = paramDesc.paramBlocks.begin(); iter != paramDesc.paramBlocks.end(); ++iter)
  459. {
  460. SPtr<GpuParamBlockBufferCore> currentBlockBuffer = bindableParams->getParamBlockBuffer(iter->second.slot);
  461. if(currentBlockBuffer != nullptr)
  462. {
  463. const D3D11GpuParamBlockBufferCore* d3d11paramBlockBuffer =
  464. static_cast<const D3D11GpuParamBlockBufferCore*>(currentBlockBuffer.get());
  465. bufferArray[0] = d3d11paramBlockBuffer->getD3D11Buffer();
  466. }
  467. else
  468. bufferArray[0] = nullptr;
  469. switch(gptype)
  470. {
  471. case GPT_VERTEX_PROGRAM:
  472. mDevice->getImmediateContext()->VSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  473. break;
  474. case GPT_FRAGMENT_PROGRAM:
  475. mDevice->getImmediateContext()->PSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  476. break;
  477. case GPT_GEOMETRY_PROGRAM:
  478. mDevice->getImmediateContext()->GSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  479. break;
  480. case GPT_HULL_PROGRAM:
  481. mDevice->getImmediateContext()->HSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  482. break;
  483. case GPT_DOMAIN_PROGRAM:
  484. mDevice->getImmediateContext()->DSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  485. break;
  486. case GPT_COMPUTE_PROGRAM:
  487. mDevice->getImmediateContext()->CSSetConstantBuffers(iter->second.slot, 1, bufferArray);
  488. break;
  489. };
  490. BS_INC_RENDER_STAT(NumGpuParamBufferBinds);
  491. }
  492. if (mDevice->hasError())
  493. BS_EXCEPT(RenderingAPIException, "Failed to setConstantBuffers : " + mDevice->getErrorDescription());
  494. }
  495. void D3D11RenderAPI::draw(UINT32 vertexOffset, UINT32 vertexCount)
  496. {
  497. THROW_IF_NOT_CORE_THREAD;
  498. applyInputLayout();
  499. mDevice->getImmediateContext()->Draw(vertexCount, vertexOffset);
  500. #if BS_DEBUG_MODE
  501. if(mDevice->hasError())
  502. LOGWRN(mDevice->getErrorDescription());
  503. #endif
  504. UINT32 primCount = vertexCountToPrimCount(mActiveDrawOp, vertexCount);
  505. BS_INC_RENDER_STAT(NumDrawCalls);
  506. BS_ADD_RENDER_STAT(NumVertices, vertexCount);
  507. BS_ADD_RENDER_STAT(NumPrimitives, primCount);
  508. }
  509. void D3D11RenderAPI::drawIndexed(UINT32 startIndex, UINT32 indexCount, UINT32 vertexOffset, UINT32 vertexCount)
  510. {
  511. THROW_IF_NOT_CORE_THREAD;
  512. applyInputLayout();
  513. mDevice->getImmediateContext()->DrawIndexed(indexCount, startIndex, vertexOffset);
  514. #if BS_DEBUG_MODE
  515. if(mDevice->hasError())
  516. LOGWRN(mDevice->getErrorDescription());
  517. #endif
  518. UINT32 primCount = vertexCountToPrimCount(mActiveDrawOp, vertexCount);
  519. BS_INC_RENDER_STAT(NumDrawCalls);
  520. BS_ADD_RENDER_STAT(NumVertices, vertexCount);
  521. BS_ADD_RENDER_STAT(NumPrimitives, primCount);
  522. }
  523. void D3D11RenderAPI::setScissorRect(UINT32 left, UINT32 top, UINT32 right, UINT32 bottom)
  524. {
  525. THROW_IF_NOT_CORE_THREAD;
  526. mScissorRect.left = static_cast<LONG>(left);
  527. mScissorRect.top = static_cast<LONG>(top);
  528. mScissorRect.bottom = static_cast<LONG>(bottom);
  529. mScissorRect.right = static_cast<LONG>(right);
  530. mDevice->getImmediateContext()->RSSetScissorRects(1, &mScissorRect);
  531. }
  532. void D3D11RenderAPI::clearViewport(UINT32 buffers, const Color& color, float depth, UINT16 stencil, UINT8 targetMask)
  533. {
  534. THROW_IF_NOT_CORE_THREAD;
  535. if(mActiveRenderTarget == nullptr)
  536. return;
  537. const RenderTargetProperties& rtProps = mActiveRenderTarget->getProperties();
  538. Rect2I clearArea((int)mViewport.TopLeftX, (int)mViewport.TopLeftY, (int)mViewport.Width, (int)mViewport.Height);
  539. bool clearEntireTarget = clearArea.width == 0 || clearArea.height == 0;
  540. clearEntireTarget |= (clearArea.x == 0 && clearArea.y == 0 && clearArea.width == rtProps.getWidth() && clearArea.height == rtProps.getHeight());
  541. if (!clearEntireTarget)
  542. {
  543. // TODO - Ignoring targetMask here
  544. D3D11RenderUtility::instance().drawClearQuad(buffers, color, depth, stencil);
  545. BS_INC_RENDER_STAT(NumClears);
  546. }
  547. else
  548. clearRenderTarget(buffers, color, depth, stencil, targetMask);
  549. }
  550. void D3D11RenderAPI::clearRenderTarget(UINT32 buffers, const Color& color, float depth, UINT16 stencil, UINT8 targetMask)
  551. {
  552. THROW_IF_NOT_CORE_THREAD;
  553. if(mActiveRenderTarget == nullptr)
  554. return;
  555. // Clear render surfaces
  556. if (buffers & FBT_COLOR)
  557. {
  558. UINT32 maxRenderTargets = mCurrentCapabilities->getNumMultiRenderTargets();
  559. ID3D11RenderTargetView** views = bs_newN<ID3D11RenderTargetView*>(maxRenderTargets);
  560. memset(views, 0, sizeof(ID3D11RenderTargetView*) * maxRenderTargets);
  561. mActiveRenderTarget->getCustomAttribute("RTV", views);
  562. if (!views[0])
  563. {
  564. bs_deleteN(views, maxRenderTargets);
  565. return;
  566. }
  567. float clearColor[4];
  568. clearColor[0] = color.r;
  569. clearColor[1] = color.g;
  570. clearColor[2] = color.b;
  571. clearColor[3] = color.a;
  572. for(UINT32 i = 0; i < maxRenderTargets; i++)
  573. {
  574. if(views[i] != nullptr && ((1 << i) & targetMask) != 0)
  575. mDevice->getImmediateContext()->ClearRenderTargetView(views[i], clearColor);
  576. }
  577. bs_deleteN(views, maxRenderTargets);
  578. }
  579. // Clear depth stencil
  580. if((buffers & FBT_DEPTH) != 0 || (buffers & FBT_STENCIL) != 0)
  581. {
  582. ID3D11DepthStencilView* depthStencilView = nullptr;
  583. mActiveRenderTarget->getCustomAttribute("DSV", &depthStencilView);
  584. D3D11_CLEAR_FLAG clearFlag;
  585. if((buffers & FBT_DEPTH) != 0 && (buffers & FBT_STENCIL) != 0)
  586. clearFlag = (D3D11_CLEAR_FLAG)(D3D11_CLEAR_DEPTH | D3D11_CLEAR_STENCIL);
  587. else if((buffers & FBT_STENCIL) != 0)
  588. clearFlag = D3D11_CLEAR_STENCIL;
  589. else
  590. clearFlag = D3D11_CLEAR_DEPTH;
  591. if(depthStencilView != nullptr)
  592. mDevice->getImmediateContext()->ClearDepthStencilView(depthStencilView, clearFlag, depth, (UINT8)stencil);
  593. }
  594. BS_INC_RENDER_STAT(NumClears);
  595. }
  596. void D3D11RenderAPI::setRenderTarget(const SPtr<RenderTargetCore>& target, bool readOnlyDepthStencil)
  597. {
  598. THROW_IF_NOT_CORE_THREAD;
  599. mActiveRenderTarget = target;
  600. UINT32 maxRenderTargets = mCurrentCapabilities->getNumMultiRenderTargets();
  601. ID3D11RenderTargetView** views = bs_newN<ID3D11RenderTargetView*>(maxRenderTargets);
  602. memset(views, 0, sizeof(ID3D11RenderTargetView*) * maxRenderTargets);
  603. ID3D11DepthStencilView* depthStencilView = nullptr;
  604. if (target != nullptr)
  605. {
  606. target->getCustomAttribute("RTV", views);
  607. if(readOnlyDepthStencil)
  608. target->getCustomAttribute("RODSV", &depthStencilView);
  609. else
  610. target->getCustomAttribute("DSV", &depthStencilView);
  611. }
  612. // Bind render targets
  613. mDevice->getImmediateContext()->OMSetRenderTargets(maxRenderTargets, views, depthStencilView);
  614. if (mDevice->hasError())
  615. BS_EXCEPT(RenderingAPIException, "Failed to setRenderTarget : " + mDevice->getErrorDescription());
  616. bs_deleteN(views, maxRenderTargets);
  617. applyViewport();
  618. BS_INC_RENDER_STAT(NumRenderTargetChanges);
  619. }
  620. void D3D11RenderAPI::setClipPlanesImpl(const PlaneList& clipPlanes)
  621. {
  622. LOGWRN("This call will be ignored. DX11 uses shaders for setting clip planes.");
  623. }
  624. RenderAPICapabilities* D3D11RenderAPI::createRenderSystemCapabilities() const
  625. {
  626. THROW_IF_NOT_CORE_THREAD;
  627. RenderAPICapabilities* rsc = bs_new<RenderAPICapabilities>();
  628. rsc->setDriverVersion(mDriverVersion);
  629. rsc->setDeviceName(mActiveD3DDriver->getDriverDescription());
  630. rsc->setRenderAPIName(getName());
  631. rsc->setStencilBufferBitDepth(8);
  632. rsc->setCapability(RSC_ANISOTROPY);
  633. rsc->setCapability(RSC_AUTOMIPMAP);
  634. // Cube map
  635. rsc->setCapability(RSC_CUBEMAPPING);
  636. // We always support compression, D3DX will decompress if device does not support
  637. rsc->setCapability(RSC_TEXTURE_COMPRESSION);
  638. rsc->setCapability(RSC_TEXTURE_COMPRESSION_DXT);
  639. rsc->setCapability(RSC_TWO_SIDED_STENCIL);
  640. rsc->setCapability(RSC_STENCIL_WRAP);
  641. rsc->setCapability(RSC_HWOCCLUSION);
  642. rsc->setCapability(RSC_HWOCCLUSION_ASYNCHRONOUS);
  643. if(mFeatureLevel >= D3D_FEATURE_LEVEL_10_1)
  644. rsc->setMaxBoundVertexBuffers(32);
  645. else
  646. rsc->setMaxBoundVertexBuffers(16);
  647. if(mFeatureLevel >= D3D_FEATURE_LEVEL_10_0)
  648. {
  649. rsc->addShaderProfile("ps_4_0");
  650. rsc->addShaderProfile("vs_4_0");
  651. rsc->addShaderProfile("gs_4_0");
  652. rsc->addGpuProgramProfile(GPP_FS_4_0, "ps_4_0");
  653. rsc->addGpuProgramProfile(GPP_VS_4_0, "vs_4_0");
  654. rsc->addGpuProgramProfile(GPP_GS_4_0, "gs_4_0");
  655. rsc->setNumTextureUnits(GPT_FRAGMENT_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  656. rsc->setNumTextureUnits(GPT_VERTEX_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  657. rsc->setNumTextureUnits(GPT_GEOMETRY_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  658. rsc->setNumCombinedTextureUnits(rsc->getNumTextureUnits(GPT_FRAGMENT_PROGRAM)
  659. + rsc->getNumTextureUnits(GPT_VERTEX_PROGRAM) + rsc->getNumTextureUnits(GPT_VERTEX_PROGRAM));
  660. rsc->setNumGpuParamBlockBuffers(GPT_FRAGMENT_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  661. rsc->setNumGpuParamBlockBuffers(GPT_VERTEX_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  662. rsc->setNumGpuParamBlockBuffers(GPT_GEOMETRY_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  663. rsc->setNumCombinedGpuParamBlockBuffers(rsc->getNumGpuParamBlockBuffers(GPT_FRAGMENT_PROGRAM)
  664. + rsc->getNumGpuParamBlockBuffers(GPT_VERTEX_PROGRAM) + rsc->getNumGpuParamBlockBuffers(GPT_VERTEX_PROGRAM));
  665. }
  666. if(mFeatureLevel >= D3D_FEATURE_LEVEL_10_1)
  667. {
  668. rsc->addShaderProfile("ps_4_1");
  669. rsc->addShaderProfile("vs_4_1");
  670. rsc->addShaderProfile("gs_4_1");
  671. rsc->addGpuProgramProfile(GPP_FS_4_1, "ps_4_1");
  672. rsc->addGpuProgramProfile(GPP_VS_4_1, "vs_4_1");
  673. rsc->addGpuProgramProfile(GPP_GS_4_1, "gs_4_1");
  674. }
  675. if(mFeatureLevel >= D3D_FEATURE_LEVEL_11_0)
  676. {
  677. rsc->addShaderProfile("ps_5_0");
  678. rsc->addShaderProfile("vs_5_0");
  679. rsc->addShaderProfile("gs_5_0");
  680. rsc->addShaderProfile("cs_5_0");
  681. rsc->addShaderProfile("hs_5_0");
  682. rsc->addShaderProfile("ds_5_0");
  683. rsc->addGpuProgramProfile(GPP_FS_5_0, "ps_5_0");
  684. rsc->addGpuProgramProfile(GPP_VS_5_0, "vs_5_0");
  685. rsc->addGpuProgramProfile(GPP_GS_5_0, "gs_5_0");
  686. rsc->addGpuProgramProfile(GPP_CS_5_0, "cs_5_0");
  687. rsc->addGpuProgramProfile(GPP_HS_5_0, "hs_5_0");
  688. rsc->addGpuProgramProfile(GPP_DS_5_0, "ds_5_0");
  689. rsc->setNumTextureUnits(GPT_HULL_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  690. rsc->setNumTextureUnits(GPT_DOMAIN_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  691. rsc->setNumTextureUnits(GPT_COMPUTE_PROGRAM, D3D11_COMMONSHADER_INPUT_RESOURCE_SLOT_COUNT);
  692. rsc->setNumCombinedTextureUnits(rsc->getNumTextureUnits(GPT_FRAGMENT_PROGRAM)
  693. + rsc->getNumTextureUnits(GPT_VERTEX_PROGRAM) + rsc->getNumTextureUnits(GPT_VERTEX_PROGRAM)
  694. + rsc->getNumTextureUnits(GPT_HULL_PROGRAM) + rsc->getNumTextureUnits(GPT_DOMAIN_PROGRAM)
  695. + rsc->getNumTextureUnits(GPT_COMPUTE_PROGRAM));
  696. rsc->setNumGpuParamBlockBuffers(GPT_HULL_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  697. rsc->setNumGpuParamBlockBuffers(GPT_DOMAIN_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  698. rsc->setNumGpuParamBlockBuffers(GPT_COMPUTE_PROGRAM, D3D11_COMMONSHADER_CONSTANT_BUFFER_API_SLOT_COUNT);
  699. rsc->setNumCombinedGpuParamBlockBuffers(rsc->getNumGpuParamBlockBuffers(GPT_FRAGMENT_PROGRAM)
  700. + rsc->getNumGpuParamBlockBuffers(GPT_VERTEX_PROGRAM) + rsc->getNumGpuParamBlockBuffers(GPT_VERTEX_PROGRAM)
  701. + rsc->getNumGpuParamBlockBuffers(GPT_HULL_PROGRAM) + rsc->getNumGpuParamBlockBuffers(GPT_DOMAIN_PROGRAM)
  702. + rsc->getNumGpuParamBlockBuffers(GPT_COMPUTE_PROGRAM));
  703. rsc->setCapability(RSC_SHADER_SUBROUTINE);
  704. }
  705. rsc->setCapability(RSC_USER_CLIP_PLANES);
  706. rsc->setCapability(RSC_VERTEX_FORMAT_UBYTE4);
  707. // Adapter details
  708. const DXGI_ADAPTER_DESC& adapterID = mActiveD3DDriver->getAdapterIdentifier();
  709. // Determine vendor
  710. switch(adapterID.VendorId)
  711. {
  712. case 0x10DE:
  713. rsc->setVendor(GPU_NVIDIA);
  714. break;
  715. case 0x1002:
  716. rsc->setVendor(GPU_AMD);
  717. break;
  718. case 0x163C:
  719. case 0x8086:
  720. rsc->setVendor(GPU_INTEL);
  721. break;
  722. default:
  723. rsc->setVendor(GPU_UNKNOWN);
  724. break;
  725. };
  726. rsc->setCapability(RSC_INFINITE_FAR_PLANE);
  727. rsc->setCapability(RSC_TEXTURE_3D);
  728. rsc->setCapability(RSC_NON_POWER_OF_2_TEXTURES);
  729. rsc->setCapability(RSC_HWRENDER_TO_TEXTURE);
  730. rsc->setCapability(RSC_TEXTURE_FLOAT);
  731. rsc->setNumMultiRenderTargets(D3D11_SIMULTANEOUS_RENDER_TARGET_COUNT);
  732. rsc->setCapability(RSC_MRT_DIFFERENT_BIT_DEPTHS);
  733. rsc->setCapability(RSC_POINT_SPRITES);
  734. rsc->setCapability(RSC_POINT_EXTENDED_PARAMETERS);
  735. rsc->setMaxPointSize(256);
  736. rsc->setCapability(RSC_VERTEX_TEXTURE_FETCH);
  737. rsc->setCapability(RSC_MIPMAP_LOD_BIAS);
  738. rsc->setCapability(RSC_PERSTAGECONSTANT);
  739. return rsc;
  740. }
  741. void D3D11RenderAPI::determineMultisampleSettings(UINT32 multisampleCount, DXGI_FORMAT format, DXGI_SAMPLE_DESC* outputSampleDesc)
  742. {
  743. bool tryCSAA = false; // Note: Disabled for now, but leaving the code for later so it might be useful
  744. enum CSAAMode { CSAA_Normal, CSAA_Quality };
  745. CSAAMode csaaMode = CSAA_Normal;
  746. bool foundValid = false;
  747. size_t origNumSamples = multisampleCount;
  748. while (!foundValid)
  749. {
  750. // Deal with special cases
  751. if (tryCSAA)
  752. {
  753. switch(multisampleCount)
  754. {
  755. case 8:
  756. if (csaaMode == CSAA_Quality)
  757. {
  758. outputSampleDesc->Count = 8;
  759. outputSampleDesc->Quality = 8;
  760. }
  761. else
  762. {
  763. outputSampleDesc->Count = 4;
  764. outputSampleDesc->Quality = 8;
  765. }
  766. break;
  767. case 16:
  768. if (csaaMode == CSAA_Quality)
  769. {
  770. outputSampleDesc->Count = 8;
  771. outputSampleDesc->Quality = 16;
  772. }
  773. else
  774. {
  775. outputSampleDesc->Count = 4;
  776. outputSampleDesc->Quality = 16;
  777. }
  778. break;
  779. }
  780. }
  781. else // !CSAA
  782. {
  783. outputSampleDesc->Count = multisampleCount == 0 ? 1 : multisampleCount;
  784. outputSampleDesc->Quality = D3D11_STANDARD_MULTISAMPLE_PATTERN;
  785. }
  786. HRESULT hr;
  787. UINT outQuality;
  788. hr = mDevice->getD3D11Device()->CheckMultisampleQualityLevels(format, outputSampleDesc->Count, &outQuality);
  789. if (SUCCEEDED(hr) && (!tryCSAA || outQuality > outputSampleDesc->Quality))
  790. {
  791. foundValid = true;
  792. }
  793. else
  794. {
  795. // Downgrade
  796. if (tryCSAA && multisampleCount == 8)
  797. {
  798. // For CSAA, we'll try downgrading with quality mode at all samples.
  799. // then try without quality, then drop CSAA
  800. if (csaaMode == CSAA_Quality)
  801. {
  802. // Drop quality first
  803. csaaMode = CSAA_Normal;
  804. }
  805. else
  806. {
  807. // Drop CSAA entirely
  808. tryCSAA = false;
  809. }
  810. // Return to original requested samples
  811. multisampleCount = static_cast<UINT32>(origNumSamples);
  812. }
  813. else
  814. {
  815. // Drop samples
  816. multisampleCount--;
  817. if (multisampleCount == 1)
  818. {
  819. // Ran out of options, no multisampling
  820. multisampleCount = 0;
  821. foundValid = true;
  822. }
  823. }
  824. }
  825. }
  826. }
  827. VertexElementType D3D11RenderAPI::getColorVertexElementType() const
  828. {
  829. return VET_COLOR_ABGR;
  830. }
  831. void D3D11RenderAPI::convertProjectionMatrix(const Matrix4& matrix, Matrix4& dest)
  832. {
  833. dest = matrix;
  834. // Convert depth range from [-1,+1] to [0,1]
  835. dest[2][0] = (dest[2][0] + dest[3][0]) / 2;
  836. dest[2][1] = (dest[2][1] + dest[3][1]) / 2;
  837. dest[2][2] = (dest[2][2] + dest[3][2]) / 2;
  838. dest[2][3] = (dest[2][3] + dest[3][3]) / 2;
  839. }
  840. float D3D11RenderAPI::getHorizontalTexelOffset()
  841. {
  842. return 0.0f;
  843. }
  844. float D3D11RenderAPI::getVerticalTexelOffset()
  845. {
  846. return 0.0f;
  847. }
  848. float D3D11RenderAPI::getMinimumDepthInputValue()
  849. {
  850. return 0.0f;
  851. }
  852. float D3D11RenderAPI::getMaximumDepthInputValue()
  853. {
  854. return 1.0f;
  855. }
  856. GpuParamBlockDesc D3D11RenderAPI::generateParamBlockDesc(const String& name, Vector<GpuParamDataDesc>& params)
  857. {
  858. GpuParamBlockDesc block;
  859. block.blockSize = 0;
  860. block.isShareable = true;
  861. block.name = name;
  862. block.slot = 0;
  863. for (auto& param : params)
  864. {
  865. const GpuParamDataTypeInfo& typeInfo = GpuParams::PARAM_SIZES.lookup[param.type];
  866. UINT32 size = typeInfo.size / 4;
  867. if (param.arraySize > 1)
  868. {
  869. // Arrays perform no packing and their elements are always padded and aligned to four component vectors
  870. UINT32 alignOffset = size % typeInfo.baseTypeSize;
  871. if (alignOffset != 0)
  872. {
  873. UINT32 padding = (typeInfo.baseTypeSize - alignOffset);
  874. size += padding;
  875. }
  876. alignOffset = block.blockSize % typeInfo.baseTypeSize;
  877. if (alignOffset != 0)
  878. {
  879. UINT32 padding = (typeInfo.baseTypeSize - alignOffset);
  880. block.blockSize += padding;
  881. }
  882. param.elementSize = size;
  883. param.arrayElementStride = size;
  884. param.cpuMemOffset = block.blockSize;
  885. param.gpuMemOffset = 0;
  886. block.blockSize += size * param.arraySize;
  887. }
  888. else
  889. {
  890. // Pack everything as tightly as possible as long as the data doesn't cross 16 byte boundary
  891. UINT32 alignOffset = block.blockSize % 4;
  892. if (alignOffset != 0 && size > (4 - alignOffset))
  893. {
  894. UINT32 padding = (4 - alignOffset);
  895. block.blockSize += padding;
  896. }
  897. param.elementSize = size;
  898. param.arrayElementStride = size;
  899. param.cpuMemOffset = block.blockSize;
  900. param.gpuMemOffset = 0;
  901. block.blockSize += size;
  902. }
  903. param.paramBlockSlot = 0;
  904. }
  905. // Constant buffer size must always be a multiple of 16
  906. if (block.blockSize % 4 != 0)
  907. block.blockSize += (4 - (block.blockSize % 4));
  908. return block;
  909. }
  910. /************************************************************************/
  911. /* PRIVATE */
  912. /************************************************************************/
  913. void D3D11RenderAPI::applyInputLayout()
  914. {
  915. if(mActiveVertexDeclaration == nullptr)
  916. {
  917. LOGWRN("Cannot apply input layout without a vertex declaration. Set vertex declaration before calling this method.");
  918. return;
  919. }
  920. if(mActiveVertexShader == nullptr)
  921. {
  922. LOGWRN("Cannot apply input layout without a vertex shader. Set vertex shader before calling this method.");
  923. return;
  924. }
  925. ID3D11InputLayout* ia = mIAManager->retrieveInputLayout(mActiveVertexShader->getInputDeclaration(), mActiveVertexDeclaration, *mActiveVertexShader);
  926. mDevice->getImmediateContext()->IASetInputLayout(ia);
  927. }
  928. }