DxilShaderFlags.cpp 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545
  1. ///////////////////////////////////////////////////////////////////////////////
  2. // //
  3. // DxilShaderFlags.cpp //
  4. // Copyright (C) Microsoft Corporation. All rights reserved. //
  5. // This file is distributed under the University of Illinois Open Source //
  6. // License. See LICENSE.TXT for details. //
  7. // //
  8. ///////////////////////////////////////////////////////////////////////////////
  9. #include "dxc/DXIL/DxilModule.h"
  10. #include "dxc/DXIL/DxilShaderFlags.h"
  11. #include "dxc/DXIL/DxilOperations.h"
  12. #include "dxc/DXIL/DxilResource.h"
  13. #include "dxc/Support/Global.h"
  14. #include "llvm/IR/LLVMContext.h"
  15. #include "llvm/IR/Instructions.h"
  16. #include "llvm/IR/Constants.h"
  17. #include "llvm/Support/Casting.h"
  18. #include "dxc/DXIL/DxilEntryProps.h"
  19. #include "dxc/DXIL/DxilInstructions.h"
  20. #include "dxc/DXIL/DxilResourceProperties.h"
  21. #include "dxc/DXIL/DxilUtil.h"
  22. using namespace hlsl;
  23. using namespace llvm;
  24. ShaderFlags::ShaderFlags():
  25. m_bDisableOptimizations(false)
  26. , m_bDisableMathRefactoring(false)
  27. , m_bEnableDoublePrecision(false)
  28. , m_bForceEarlyDepthStencil(false)
  29. , m_bEnableRawAndStructuredBuffers(false)
  30. , m_bLowPrecisionPresent(false)
  31. , m_bEnableDoubleExtensions(false)
  32. , m_bEnableMSAD(false)
  33. , m_bAllResourcesBound(false)
  34. , m_bViewportAndRTArrayIndex(false)
  35. , m_bInnerCoverage(false)
  36. , m_bStencilRef(false)
  37. , m_bTiledResources(false)
  38. , m_bUAVLoadAdditionalFormats(false)
  39. , m_bLevel9ComparisonFiltering(false)
  40. , m_b64UAVs(false)
  41. , m_UAVsAtEveryStage(false)
  42. , m_bCSRawAndStructuredViaShader4X(false)
  43. , m_bROVS(false)
  44. , m_bWaveOps(false)
  45. , m_bInt64Ops(false)
  46. , m_bViewID(false)
  47. , m_bBarycentrics(false)
  48. , m_bUseNativeLowPrecision(false)
  49. , m_bShadingRate(false)
  50. , m_bRaytracingTier1_1(false)
  51. , m_bSamplerFeedback(false)
  52. , m_bAtomicInt64OnTypedResource(false)
  53. , m_bAtomicInt64OnGroupShared(false)
  54. , m_bDerivativesInMeshAndAmpShaders(false)
  55. , m_align0(0)
  56. , m_align1(0)
  57. {
  58. // Silence unused field warnings
  59. (void)m_align0;
  60. (void)m_align1;
  61. }
  62. uint64_t ShaderFlags::GetFeatureInfo() const {
  63. uint64_t Flags = 0;
  64. Flags |= m_bEnableDoublePrecision ? hlsl::DXIL::ShaderFeatureInfo_Doubles : 0;
  65. Flags |= m_bLowPrecisionPresent && !m_bUseNativeLowPrecision
  66. ? hlsl::DXIL::ShaderFeatureInfo_MinimumPrecision
  67. : 0;
  68. Flags |= m_bLowPrecisionPresent && m_bUseNativeLowPrecision
  69. ? hlsl::DXIL::ShaderFeatureInfo_NativeLowPrecision
  70. : 0;
  71. Flags |= m_bEnableDoubleExtensions
  72. ? hlsl::DXIL::ShaderFeatureInfo_11_1_DoubleExtensions
  73. : 0;
  74. Flags |= m_bWaveOps ? hlsl::DXIL::ShaderFeatureInfo_WaveOps : 0;
  75. Flags |= m_bInt64Ops ? hlsl::DXIL::ShaderFeatureInfo_Int64Ops : 0;
  76. Flags |= m_bROVS ? hlsl::DXIL::ShaderFeatureInfo_ROVs : 0;
  77. Flags |=
  78. m_bViewportAndRTArrayIndex
  79. ? hlsl::DXIL::
  80. ShaderFeatureInfo_ViewportAndRTArrayIndexFromAnyShaderFeedingRasterizer
  81. : 0;
  82. Flags |= m_bInnerCoverage ? hlsl::DXIL::ShaderFeatureInfo_InnerCoverage : 0;
  83. Flags |= m_bStencilRef ? hlsl::DXIL::ShaderFeatureInfo_StencilRef : 0;
  84. Flags |= m_bTiledResources ? hlsl::DXIL::ShaderFeatureInfo_TiledResources : 0;
  85. Flags |=
  86. m_bEnableMSAD ? hlsl::DXIL::ShaderFeatureInfo_11_1_ShaderExtensions : 0;
  87. Flags |=
  88. m_bCSRawAndStructuredViaShader4X
  89. ? hlsl::DXIL::
  90. ShaderFeatureInfo_ComputeShadersPlusRawAndStructuredBuffersViaShader4X
  91. : 0;
  92. Flags |=
  93. m_UAVsAtEveryStage ? hlsl::DXIL::ShaderFeatureInfo_UAVsAtEveryStage : 0;
  94. Flags |= m_b64UAVs ? hlsl::DXIL::ShaderFeatureInfo_64UAVs : 0;
  95. Flags |= m_bLevel9ComparisonFiltering
  96. ? hlsl::DXIL::ShaderFeatureInfo_LEVEL9ComparisonFiltering
  97. : 0;
  98. Flags |= m_bUAVLoadAdditionalFormats
  99. ? hlsl::DXIL::ShaderFeatureInfo_TypedUAVLoadAdditionalFormats
  100. : 0;
  101. Flags |= m_bViewID ? hlsl::DXIL::ShaderFeatureInfo_ViewID : 0;
  102. Flags |= m_bBarycentrics ? hlsl::DXIL::ShaderFeatureInfo_Barycentrics : 0;
  103. Flags |= m_bShadingRate ? hlsl::DXIL::ShaderFeatureInfo_ShadingRate : 0;
  104. Flags |= m_bRaytracingTier1_1 ? hlsl::DXIL::ShaderFeatureInfo_Raytracing_Tier_1_1 : 0;
  105. Flags |= m_bSamplerFeedback ? hlsl::DXIL::ShaderFeatureInfo_SamplerFeedback : 0;
  106. Flags |= m_bAtomicInt64OnTypedResource ? hlsl::DXIL::ShaderFeatureInfo_AtomicInt64OnTypedResource : 0;
  107. Flags |= m_bAtomicInt64OnGroupShared ? hlsl::DXIL::ShaderFeatureInfo_AtomicInt64OnGroupShared : 0;
  108. Flags |= m_bDerivativesInMeshAndAmpShaders ? hlsl::DXIL::ShaderFeatureInfo_DerivativesInMeshAndAmpShaders : 0;
  109. return Flags;
  110. }
  111. uint64_t ShaderFlags::GetShaderFlagsRaw() const {
  112. union Cast {
  113. Cast(const ShaderFlags &flags) {
  114. shaderFlags = flags;
  115. }
  116. ShaderFlags shaderFlags;
  117. uint64_t rawData;
  118. };
  119. static_assert(sizeof(uint64_t) == sizeof(ShaderFlags),
  120. "size must match to make sure no undefined bits when cast");
  121. Cast rawCast(*this);
  122. return rawCast.rawData;
  123. }
  124. void ShaderFlags::SetShaderFlagsRaw(uint64_t data) {
  125. union Cast {
  126. Cast(uint64_t data) {
  127. rawData = data;
  128. }
  129. ShaderFlags shaderFlags;
  130. uint64_t rawData;
  131. };
  132. Cast rawCast(data);
  133. *this = rawCast.shaderFlags;
  134. }
  135. uint64_t ShaderFlags::GetShaderFlagsRawForCollection() {
  136. // This should be all the flags that can be set by DxilModule::CollectShaderFlags.
  137. ShaderFlags Flags;
  138. Flags.SetEnableDoublePrecision(true);
  139. Flags.SetInt64Ops(true);
  140. Flags.SetLowPrecisionPresent(true);
  141. Flags.SetEnableDoubleExtensions(true);
  142. Flags.SetWaveOps(true);
  143. Flags.SetTiledResources(true);
  144. Flags.SetEnableMSAD(true);
  145. Flags.SetUAVLoadAdditionalFormats(true);
  146. Flags.SetStencilRef(true);
  147. Flags.SetInnerCoverage(true);
  148. Flags.SetViewportAndRTArrayIndex(true);
  149. Flags.Set64UAVs(true);
  150. Flags.SetUAVsAtEveryStage(true);
  151. Flags.SetEnableRawAndStructuredBuffers(true);
  152. Flags.SetCSRawAndStructuredViaShader4X(true);
  153. Flags.SetViewID(true);
  154. Flags.SetBarycentrics(true);
  155. Flags.SetShadingRate(true);
  156. Flags.SetRaytracingTier1_1(true);
  157. Flags.SetSamplerFeedback(true);
  158. Flags.SetAtomicInt64OnTypedResource(true);
  159. Flags.SetAtomicInt64OnGroupShared(true);
  160. Flags.SetDerivativesInMeshAndAmpShaders(true);
  161. return Flags.GetShaderFlagsRaw();
  162. }
  163. unsigned ShaderFlags::GetGlobalFlags() const {
  164. unsigned Flags = 0;
  165. Flags |= m_bDisableOptimizations ? DXIL::kDisableOptimizations : 0;
  166. Flags |= m_bDisableMathRefactoring ? DXIL::kDisableMathRefactoring : 0;
  167. Flags |= m_bEnableDoublePrecision ? DXIL::kEnableDoublePrecision : 0;
  168. Flags |= m_bForceEarlyDepthStencil ? DXIL::kForceEarlyDepthStencil : 0;
  169. Flags |= m_bEnableRawAndStructuredBuffers ? DXIL::kEnableRawAndStructuredBuffers : 0;
  170. Flags |= m_bLowPrecisionPresent && !m_bUseNativeLowPrecision? DXIL::kEnableMinPrecision : 0;
  171. Flags |= m_bEnableDoubleExtensions ? DXIL::kEnableDoubleExtensions : 0;
  172. Flags |= m_bEnableMSAD ? DXIL::kEnableMSAD : 0;
  173. Flags |= m_bAllResourcesBound ? DXIL::kAllResourcesBound : 0;
  174. return Flags;
  175. }
  176. // Given a CreateHandle call, returns arbitrary ConstantInt rangeID
  177. // Note: HLSL is currently assuming that rangeID is a constant value, but this code is assuming
  178. // that it can be either constant, phi node, or select instruction
  179. static ConstantInt *GetArbitraryConstantRangeID(CallInst *handleCall) {
  180. Value *rangeID =
  181. handleCall->getArgOperand(DXIL::OperandIndex::kCreateHandleResIDOpIdx);
  182. ConstantInt *ConstantRangeID = dyn_cast<ConstantInt>(rangeID);
  183. while (ConstantRangeID == nullptr) {
  184. if (ConstantInt *CI = dyn_cast<ConstantInt>(rangeID)) {
  185. ConstantRangeID = CI;
  186. } else if (PHINode *PN = dyn_cast<PHINode>(rangeID)) {
  187. rangeID = PN->getIncomingValue(0);
  188. } else if (SelectInst *SI = dyn_cast<SelectInst>(rangeID)) {
  189. rangeID = SI->getTrueValue();
  190. } else {
  191. return nullptr;
  192. }
  193. }
  194. return ConstantRangeID;
  195. }
  196. // Given a handle type, find an arbitrary call instructions to create handle
  197. static CallInst *FindCallToCreateHandle(Value *handleType) {
  198. Value *curVal = handleType;
  199. CallInst *CI = dyn_cast<CallInst>(handleType);
  200. while (CI == nullptr) {
  201. if (PHINode *PN = dyn_cast<PHINode>(curVal)) {
  202. curVal = PN->getIncomingValue(0);
  203. }
  204. else if (SelectInst *SI = dyn_cast<SelectInst>(curVal)) {
  205. curVal = SI->getTrueValue();
  206. }
  207. else {
  208. return nullptr;
  209. }
  210. CI = dyn_cast<CallInst>(curVal);
  211. }
  212. return CI;
  213. }
  214. DxilResourceProperties GetResourcePropertyFromHandleCall(const hlsl::DxilModule *M, CallInst *handleCall) {
  215. DxilResourceProperties RP;
  216. ConstantInt *HandleOpCodeConst = cast<ConstantInt>(
  217. handleCall->getArgOperand(DXIL::OperandIndex::kOpcodeIdx));
  218. DXIL::OpCode handleOp = static_cast<DXIL::OpCode>(HandleOpCodeConst->getLimitedValue());
  219. if (handleOp == DXIL::OpCode::CreateHandle) {
  220. if (ConstantInt *resClassArg =
  221. dyn_cast<ConstantInt>(handleCall->getArgOperand(
  222. DXIL::OperandIndex::kCreateHandleResClassOpIdx))) {
  223. DXIL::ResourceClass resClass = static_cast<DXIL::ResourceClass>(
  224. resClassArg->getLimitedValue());
  225. ConstantInt *rangeID = GetArbitraryConstantRangeID(handleCall);
  226. if (rangeID) {
  227. DxilResource resource;
  228. if (resClass == DXIL::ResourceClass::UAV)
  229. resource = M->GetUAV(rangeID->getLimitedValue());
  230. else if (resClass == DXIL::ResourceClass::SRV)
  231. resource = M->GetSRV(rangeID->getLimitedValue());
  232. RP = resource_helper::loadPropsFromResourceBase(&resource);
  233. }
  234. }
  235. }
  236. else if (handleOp == DXIL::OpCode::CreateHandleForLib) {
  237. // If library handle, find DxilResource by checking the name
  238. if (LoadInst *LI = dyn_cast<LoadInst>(handleCall->getArgOperand(
  239. DXIL::OperandIndex::kCreateHandleForLibResOpIdx))) {
  240. Value *resType = LI->getOperand(0);
  241. for (auto &&res : M->GetUAVs()) {
  242. if (res->GetGlobalSymbol() == resType) {
  243. RP = resource_helper::loadPropsFromResourceBase(res.get());
  244. }
  245. }
  246. }
  247. } else if (handleOp == DXIL::OpCode::AnnotateHandle) {
  248. DxilInst_AnnotateHandle annotateHandle(cast<Instruction>(handleCall));
  249. Type *ResPropTy = M->GetOP()->GetResourcePropertiesType();
  250. RP = resource_helper::loadPropsFromAnnotateHandle(annotateHandle, ResPropTy, *M->GetShaderModel());
  251. }
  252. return RP;
  253. }
  254. ShaderFlags ShaderFlags::CollectShaderFlags(const Function *F,
  255. const hlsl::DxilModule *M) {
  256. ShaderFlags flag;
  257. // Module level options
  258. flag.SetUseNativeLowPrecision(!M->GetUseMinPrecision());
  259. flag.SetDisableOptimizations(M->GetDisableOptimization());
  260. flag.SetAllResourcesBound(M->GetAllResourcesBound());
  261. bool hasDouble = false;
  262. // ddiv dfma drcp d2i d2u i2d u2d.
  263. // fma has dxil op. Others should check IR instruction div/cast.
  264. bool hasDoubleExtension = false;
  265. bool has64Int = false;
  266. bool has16 = false;
  267. bool hasWaveOps = false;
  268. bool hasCheckAccessFully = false;
  269. bool hasMSAD = false;
  270. bool hasStencilRef = false;
  271. bool hasInnerCoverage = false;
  272. bool hasViewID = false;
  273. bool hasMulticomponentUAVLoads = false;
  274. bool hasViewportOrRTArrayIndex = false;
  275. bool hasShadingRate = false;
  276. bool hasSamplerFeedback = false;
  277. bool hasRaytracingTier1_1 = false;
  278. bool hasAtomicInt64OnTypedResource = false;
  279. bool hasAtomicInt64OnGroupShared = false;
  280. bool hasDerivativesInMeshAndAmpShaders = false;
  281. // Try to maintain compatibility with a v1.0 validator if that's what we have.
  282. uint32_t valMajor, valMinor;
  283. M->GetValidatorVersion(valMajor, valMinor);
  284. bool hasMulticomponentUAVLoadsBackCompat = valMajor == 1 && valMinor == 0;
  285. bool hasViewportOrRTArrayIndexBackCombat = valMajor == 1 && valMinor < 4;
  286. Type *int16Ty = Type::getInt16Ty(F->getContext());
  287. Type *int64Ty = Type::getInt64Ty(F->getContext());
  288. for (const BasicBlock &BB : F->getBasicBlockList()) {
  289. for (const Instruction &I : BB.getInstList()) {
  290. // Skip none dxil function call.
  291. if (const CallInst *CI = dyn_cast<CallInst>(&I)) {
  292. if (!OP::IsDxilOpFunc(CI->getCalledFunction()))
  293. continue;
  294. }
  295. Type *Ty = I.getType();
  296. bool isDouble = Ty->isDoubleTy();
  297. bool isHalf = Ty->isHalfTy();
  298. bool isInt16 = Ty == int16Ty;
  299. bool isInt64 = Ty == int64Ty;
  300. if (isa<ExtractElementInst>(&I) ||
  301. isa<InsertElementInst>(&I))
  302. continue;
  303. for (Value *operand : I.operands()) {
  304. Type *Ty = operand->getType();
  305. isDouble |= Ty->isDoubleTy();
  306. isHalf |= Ty->isHalfTy();
  307. isInt16 |= Ty == int16Ty;
  308. isInt64 |= Ty == int64Ty;
  309. }
  310. if (isDouble) {
  311. hasDouble = true;
  312. switch (I.getOpcode()) {
  313. case Instruction::FDiv:
  314. case Instruction::UIToFP:
  315. case Instruction::SIToFP:
  316. case Instruction::FPToUI:
  317. case Instruction::FPToSI:
  318. hasDoubleExtension = true;
  319. break;
  320. }
  321. }
  322. if (isInt64) {
  323. has64Int = true;
  324. switch (I.getOpcode()) {
  325. case Instruction::AtomicCmpXchg:
  326. case Instruction::AtomicRMW:
  327. hasAtomicInt64OnGroupShared = true;
  328. break;
  329. }
  330. }
  331. has16 |= isHalf;
  332. has16 |= isInt16;
  333. if (const CallInst *CI = dyn_cast<CallInst>(&I)) {
  334. if (!OP::IsDxilOpFunc(CI->getCalledFunction()))
  335. continue;
  336. Value *opcodeArg = CI->getArgOperand(DXIL::OperandIndex::kOpcodeIdx);
  337. ConstantInt *opcodeConst = dyn_cast<ConstantInt>(opcodeArg);
  338. DXASSERT(opcodeConst, "DXIL opcode arg must be immediate");
  339. unsigned opcode = opcodeConst->getLimitedValue();
  340. DXASSERT(opcode < static_cast<unsigned>(DXIL::OpCode::NumOpCodes),
  341. "invalid DXIL opcode");
  342. DXIL::OpCode dxilOp = static_cast<DXIL::OpCode>(opcode);
  343. if (hlsl::OP::IsDxilOpWave(dxilOp))
  344. hasWaveOps = true;
  345. switch (dxilOp) {
  346. case DXIL::OpCode::CheckAccessFullyMapped:
  347. hasCheckAccessFully = true;
  348. break;
  349. case DXIL::OpCode::Msad:
  350. hasMSAD = true;
  351. break;
  352. case DXIL::OpCode::BufferLoad:
  353. case DXIL::OpCode::TextureLoad: {
  354. if (hasMulticomponentUAVLoads) continue;
  355. // This is the old-style computation (overestimating requirements).
  356. Value *resHandle = CI->getArgOperand(DXIL::OperandIndex::kBufferStoreHandleOpIdx);
  357. CallInst *handleCall = FindCallToCreateHandle(resHandle);
  358. // Check if this is a library handle or general create handle
  359. if (handleCall) {
  360. DxilResourceProperties RP = GetResourcePropertyFromHandleCall(M, handleCall);
  361. if (RP.isUAV()) {
  362. // Validator 1.0 assumes that all uav load is multi component load.
  363. if (hasMulticomponentUAVLoadsBackCompat) {
  364. hasMulticomponentUAVLoads = true;
  365. continue;
  366. } else {
  367. if (DXIL::IsTyped(RP.getResourceKind()) &&
  368. RP.Typed.CompCount > 1)
  369. hasMulticomponentUAVLoads = true;
  370. }
  371. }
  372. }
  373. } break;
  374. case DXIL::OpCode::Fma:
  375. hasDoubleExtension |= isDouble;
  376. break;
  377. case DXIL::OpCode::InnerCoverage:
  378. hasInnerCoverage = true;
  379. break;
  380. case DXIL::OpCode::ViewID:
  381. hasViewID = true;
  382. break;
  383. case DXIL::OpCode::AllocateRayQuery:
  384. case DXIL::OpCode::GeometryIndex:
  385. hasRaytracingTier1_1 = true;
  386. break;
  387. case DXIL::OpCode::AtomicBinOp:
  388. case DXIL::OpCode::AtomicCompareExchange:
  389. if (isInt64) {
  390. Value *resHandle = CI->getArgOperand(DXIL::OperandIndex::kAtomicBinOpHandleOpIdx);
  391. CallInst *handleCall = FindCallToCreateHandle(resHandle);
  392. DxilResourceProperties RP = GetResourcePropertyFromHandleCall(M, handleCall);
  393. if (DXIL::IsTyped(RP.getResourceKind()))
  394. hasAtomicInt64OnTypedResource = true;
  395. }
  396. break;
  397. case DXIL::OpCode::DerivFineX:
  398. case DXIL::OpCode::DerivFineY:
  399. case DXIL::OpCode::DerivCoarseX:
  400. case DXIL::OpCode::DerivCoarseY:
  401. case DXIL::OpCode::CalculateLOD:
  402. case DXIL::OpCode::Sample:
  403. case DXIL::OpCode::SampleBias:
  404. case DXIL::OpCode::SampleCmp: {
  405. const ShaderModel *pSM = M->GetShaderModel();
  406. if (pSM->IsAS() || pSM->IsMS())
  407. hasDerivativesInMeshAndAmpShaders = true;
  408. } break;
  409. default:
  410. // Normal opcodes.
  411. break;
  412. }
  413. }
  414. }
  415. }
  416. // If this function is a shader, add flags based on signatures
  417. if (M->HasDxilEntryProps(F)) {
  418. const DxilEntryProps &entryProps = M->GetDxilEntryProps(F);
  419. // Val ver < 1.4 has a bug where input case was always clobbered by the
  420. // output check. The only case where it made a difference such that an
  421. // incorrect flag would be set was for the HS and DS input cases.
  422. // It was also checking PS input and output, but PS output could not have
  423. // the semantic, and since it was clobbering the result, it would always
  424. // clear it. Since this flag should not be set for PS at all,
  425. // it produced the correct result for PS by accident.
  426. bool checkInputRTArrayIndex = entryProps.props.IsGS();
  427. if (!hasViewportOrRTArrayIndexBackCombat)
  428. checkInputRTArrayIndex |= entryProps.props.IsDS() ||
  429. entryProps.props.IsHS();
  430. bool checkOutputRTArrayIndex =
  431. entryProps.props.IsVS() || entryProps.props.IsDS() ||
  432. entryProps.props.IsHS();
  433. for (auto &&E : entryProps.sig.InputSignature.GetElements()) {
  434. switch (E->GetKind()) {
  435. case Semantic::Kind::ViewPortArrayIndex:
  436. case Semantic::Kind::RenderTargetArrayIndex:
  437. if (checkInputRTArrayIndex)
  438. hasViewportOrRTArrayIndex = true;
  439. break;
  440. case Semantic::Kind::ShadingRate:
  441. hasShadingRate = true;
  442. break;
  443. default:
  444. break;
  445. }
  446. }
  447. for (auto &&E : entryProps.sig.OutputSignature.GetElements()) {
  448. switch (E->GetKind()) {
  449. case Semantic::Kind::ViewPortArrayIndex:
  450. case Semantic::Kind::RenderTargetArrayIndex:
  451. if (checkOutputRTArrayIndex)
  452. hasViewportOrRTArrayIndex = true;
  453. break;
  454. case Semantic::Kind::StencilRef:
  455. if (entryProps.props.IsPS())
  456. hasStencilRef = true;
  457. break;
  458. case Semantic::Kind::InnerCoverage:
  459. if (entryProps.props.IsPS())
  460. hasInnerCoverage = true;
  461. break;
  462. case Semantic::Kind::ShadingRate:
  463. hasShadingRate = true;
  464. break;
  465. default:
  466. break;
  467. }
  468. }
  469. }
  470. if (!hasRaytracingTier1_1) {
  471. if (const DxilSubobjects *pSubobjects = M->GetSubobjects()) {
  472. for (const auto &it : pSubobjects->GetSubobjects()) {
  473. switch (it.second->GetKind()) {
  474. case DXIL::SubobjectKind::RaytracingPipelineConfig1:
  475. hasRaytracingTier1_1 = true;
  476. break;
  477. case DXIL::SubobjectKind::StateObjectConfig: {
  478. uint32_t Flags;
  479. if (it.second->GetStateObjectConfig(Flags) &&
  480. ((Flags & ~(unsigned)DXIL::StateObjectFlags::ValidMask_1_4) != 0))
  481. hasRaytracingTier1_1 = true;
  482. } break;
  483. default:
  484. break;
  485. }
  486. if (hasRaytracingTier1_1)
  487. break;
  488. }
  489. }
  490. }
  491. flag.SetEnableDoublePrecision(hasDouble);
  492. flag.SetStencilRef(hasStencilRef);
  493. flag.SetInnerCoverage(hasInnerCoverage);
  494. flag.SetInt64Ops(has64Int);
  495. flag.SetLowPrecisionPresent(has16);
  496. flag.SetEnableDoubleExtensions(hasDoubleExtension);
  497. flag.SetWaveOps(hasWaveOps);
  498. flag.SetTiledResources(hasCheckAccessFully);
  499. flag.SetEnableMSAD(hasMSAD);
  500. flag.SetUAVLoadAdditionalFormats(hasMulticomponentUAVLoads);
  501. flag.SetViewID(hasViewID);
  502. flag.SetViewportAndRTArrayIndex(hasViewportOrRTArrayIndex);
  503. flag.SetShadingRate(hasShadingRate);
  504. flag.SetSamplerFeedback(hasSamplerFeedback);
  505. flag.SetRaytracingTier1_1(hasRaytracingTier1_1);
  506. flag.SetAtomicInt64OnTypedResource(hasAtomicInt64OnTypedResource);
  507. flag.SetAtomicInt64OnGroupShared(hasAtomicInt64OnGroupShared);
  508. flag.SetDerivativesInMeshAndAmpShaders(hasDerivativesInMeshAndAmpShaders);
  509. return flag;
  510. }
  511. void ShaderFlags::CombineShaderFlags(const ShaderFlags &other) {
  512. SetShaderFlagsRaw(GetShaderFlagsRaw() | other.GetShaderFlagsRaw());
  513. }