7 years ago · a26681c807
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -84,6 +84,12 @@ option(HLSL_ENABLE_FIXED_VER "Sets up fixed version information." OFF) # HLSL Ch
 
															 option(HLSL_ENABLE_ANALYZE "Enables compiler analysis during compilation." OFF) # HLSL Change
														
 
															 option(HLSL_OPTIONAL_PROJS_IN_DEFAULT "Include optional projects in default build target." OFF) # HLSL Change
														
 
															+# HLSL Change Starts - set flag for Appveyor CI
														
 
															+if ( "$ENV{CI}" AND "$ENV{APPVEYOR}" )
														
 
															+  add_definitions(-DDXC_ON_APPVEYOR_CI)
														
 
															+endif()
														
 
															+# HLSL Change ends
														
 
															+
														
 
															 # SPIRV change starts
														
 
															 option(ENABLE_SPIRV_CODEGEN "Enables SPIR-V code generation." OFF)
														
 
															 option(SPIRV_BUILD_TESTS "Build targets for the SPIR-V unit tests." OFF)
														
--- a/README.md
+++ b/README.md
@@ -67,15 +67,12 @@ To run shaders compiled as DXIL, you will need support from the operating system
 
															 Hardware GPU support for DXIL is provided by the following vendors:
														
 
															 #### NVIDIA
														
 
															-NVIDIA's r387 drivers (r387.92 and later) provide release mode support for DXIL
														
 
															-1.0 and Shader Model 6.0 on Win10 FCU and later, and experimental mode support
														
 
															-for DXIL 1.1 and Shader Model 6.1. This driver can be downloaded from
														
 
															-[geforce.com](https://www.geforce.com/drivers). Direct links for r388.59 (most
														
 
															-current as of this update) are provided below:
														
 
															+NVIDIA's r396 drivers (r397.64 and later) provide release mode support for DXIL
														
 
															+1.1 and Shader Model 6.1 on Win10 1709 and later, and experimental mode support
														
 
															+for DXIL 1.2 and Shader Model 6.2 on Win10 1803 and later. These drivers also
														
 
															+support DXR in experimental mode.
														
 
															-[Win10 Installer](http://uk.download.nvidia.com/Windows/388.59/388.59-desktop-win10-64bit-international-whql.exe)
														
 
															-
														
 
															-[Release Notes](http://us.download.nvidia.com/Windows/388.59/388.59-win10-win8-win7-desktop-release-notes.pdf)
														
 
															+Drivers can be downloaded from [geforce.com](https://www.geforce.com/drivers).
														
 
															 #### AMD
														
 
															 AMD's latest driver with support for DXIL 1.0 and Shader Model 6 in experimental mode is [Radeon Software Crimson ReLive Edition 17.4.2](http://support.amd.com/en-us/kb-articles/Pages/Radeon-Software-Crimson-ReLive-Edition-17.4.2-Release-Notes.aspx).
														
--- a/appveyor.yml
+++ b/appveyor.yml
@@ -10,6 +10,7 @@ clone_depth: 1
 
															 environment:
														
 
															   HLSL_SRC_DIR: c:\projects\DirectXShaderCompiler
														
 
															   HLSL_BLD_DIR: c:\projects\DirectXShaderCompiler\build
														
 
															+  ARTIFACTS_ZIP_NAME: dxc-artifacts.zip
														
 
															 install:
														
 
															 - cmd: git submodule update --init
														
@@ -25,11 +26,13 @@ test_script:
 
															 - cmd: call utils\hct\hcttest -rel spirv_only
														
 
															 after_test:
														
 
															-- cmd: cd build\%CONFIGURATION%\bin
														
 
															-- cmd: 7z a artifacts.zip d*.exe d*.dll HLSLHost.exe
														
 
															+- cmd: cd build\%CONFIGURATION%
														
 
															+- cmd: echo %APPVEYOR_REPO_COMMIT% > GIT-COMMIT.txt
														
 
															+- cmd: xcopy "%HLSL_SRC_DIR%\include\dxc" include\dxc /s /i /y
														
 
															+- cmd: 7z a %ARTIFACTS_ZIP_NAME% include lib\d*.lib bin\d*.exe bin\d*.dll bin\d*.pdb bin\HLSLHost.exe GIT-COMMIT.txt
														
 
															 artifacts:
														
 
															-- path: build\$(configuration)\bin\artifacts.zip
														
 
															+- path: build\$(configuration)\$(ARTIFACTS_ZIP_NAME)
														
 
															 notifications:
														
 
															 - provider: GitHubPullRequest
														
--- a/docs/SPIR-V.rst
+++ b/docs/SPIR-V.rst
@@ -120,7 +120,7 @@ decorated by the ``Position``, ``ClipDistance``, ``CullDistance`` builtin,
 
															 and two of them are decorated by the ``Location`` decoration. (Note that
														
 
															 ``clip0`` and ``clip1`` are concatenated, also ``cull0`` and ``cull1``.
														
 
															 The ``ClipDistance`` and ``CullDistance`` builtins are special and explained
														
 
															-in the `gl_PerVertex`_ section.)
														
 
															+in the `ClipDistance & CullDistance`_ section.)
														
 
															 Flattening is infective because of Vulkan interface matching rules. If we
														
 
															 flatten a struct in the output of a previous stage, which may create multiple
														
@@ -133,25 +133,6 @@ hull/domain/geometry shader, their inputs/outputs have an additional arrayness.
 
															 So if we are seeing an array of structs in these shaders, we need to flatten
														
 
															 them into arrays of its fields.
														
 
															-Lastly, to satisfy the type requirements on builtins, after flattening, the
														
 
															-variables decorated with ``Position``, ``ClipDistance``, and ``CullDistance``
														
 
															-builtins are grouped into struct, like ``gl_PerVertex`` for certain shader stage
														
 
															-interface:
														
 
															-
														
 
															-============ ===== ======
														
 
															-Shader Stage Input Output
														
 
															-============ ===== ======
														
 
															-    VS         X     G
														
 
															-    HS         G     G
														
 
															-    DS         G     G
														
 
															-    GS         G     S
														
 
															-    PS         S     X
														
 
															-============ ===== ======
														
 
															-
														
 
															-(``X``: Not applicable, ``G``: Grouped, ``S``: separated)
														
 
															-
														
 
															-More details in the `gl_PerVertex`_ section.
														
 
															-
														
 
															 Vulkan specific features
														
 
															 ------------------------
														
@@ -275,6 +256,8 @@ The namespace ``vk`` will be used for all Vulkan attributes:
 
															 - ``builtin("X")``: For specifying an entity should be translated into a certain
														
 
															   Vulkan builtin variable. Allowed on function parameters, function returns,
														
 
															   and struct fields.
														
 
															+- ``index(X)``: For specifying the index at a specific pixel shader output
														
 
															+  location. Used for dual-source blending.
														
 
															 Only ``vk::`` attributes in the above list are supported. Other attributes will
														
 
															 result in warnings and be ignored by the compiler. All C++11 attributes will
														
@@ -576,6 +559,18 @@ HLSL Interpolation Modifier SPIR-V Decoration   SPIR-V Capability
 
															 ``sample``                  ``Sample``        ``SampleRateShading``
														
 
															 =========================== ================= =====================
														
 
															+Arrays
														
 
															+------
														
 
															+
														
 
															+Sized (either explicitly or implicitly) arrays are translated into SPIR-V
														
 
															+`OpTypeArray`. Unsized arrays are translated into `OpTypeRuntimeArray`.
														
 
															+
														
 
															+Arrays, if used for external resources (residing in SPIR-V `Uniform` or
														
 
															+`UniformConstant` storage class), will need layout decorations like SPIR-V
														
 
															+`ArrayStride` decoration. For arrays of opaque types, e.g., HLSL textures
														
 
															+or samplers, we don't decorate with `ArrayStride` decorations since there is
														
 
															+no meaningful strides. Similarly for arrays of structured/byte buffers.
														
 
															+
														
 
															 User-defined types
														
 
															 ------------------
														
@@ -603,22 +598,22 @@ are translated into SPIR-V ``OpTypeImage``, with parameters:
 
															 ----------------------- -------------------------- ------------------------------------------------------------------------------------------
														
 
															      Texture Type         Descriptor Type    RO/RW    Storage Class        Dim    Depth Arrayed MS Sampled   Image Format      Capability
														
 
															 ======================= ==================== ===== =================== ========== ===== ======= == ======= ================ =================
														
 
															-``Texture1D``           Sampled Image         RO   ``UniformConstant`` ``1D``      0       0    0    1     ``Unknown``
														
 
															-``Texture2D``           Sampled Image         RO   ``UniformConstant`` ``2D``      0       0    0    1     ``Unknown``
														
 
															-``Texture3D``           Sampled Image         RO   ``UniformConstant`` ``3D``      0       0    0    1     ``Unknown``
														
 
															-``TextureCube``         Sampled Image         RO   ``UniformConstant`` ``Cube``    0       0    0    1     ``Unknown``
														
 
															-``Texture1DArray``      Sampled Image         RO   ``UniformConstant`` ``1D``      0       1    0    1     ``Unknown``
														
 
															-``Texture2DArray``      Sampled Image         RO   ``UniformConstant`` ``2D``      0       1    0    1     ``Unknown``
														
 
															-``Texture2DMS``         Sampled Image         RO   ``UniformConstant`` ``2D``      0       0    1    1     ``Unknown``
														
 
															-``Texture2DMSArray``    Sampled Image         RO   ``UniformConstant`` ``2D``      0       1    1    1     ``Unknown``      ``ImageMSArray``
														
 
															-``TextureCubeArray``    Sampled Image         RO   ``UniformConstant`` ``3D``      0       1    0    1     ``Unknown``
														
 
															-``Buffer<T>``           Uniform Texel Buffer  RO   ``UniformConstant`` ``Buffer``  0       0    0    1     Depends on ``T`` ``SampledBuffer``
														
 
															-``RWBuffer<T>``         Storage Texel Buffer  RW   ``UniformConstant`` ``Buffer``  0       0    0    2     Depends on ``T`` ``SampledBuffer``
														
 
															-``RWTexture1D<T>``      Storage Image         RW   ``UniformConstant`` ``1D``      0       0    0    2     Depends on ``T``
														
 
															-``RWTexture2D<T>``      Storage Image         RW   ``UniformConstant`` ``2D``      0       0    0    2     Depends on ``T``
														
 
															-``RWTexture3D<T>``      Storage Image         RW   ``UniformConstant`` ``3D``      0       0    0    2     Depends on ``T``
														
 
															-``RWTexture1DArray<T>`` Storage Image         RW   ``UniformConstant`` ``1D``      0       1    0    2     Depends on ``T``
														
 
															-``RWTexture2DArray<T>`` Storage Image         RW   ``UniformConstant`` ``2D``      0       1    0    2     Depends on ``T``
														
 
															+``Texture1D``           Sampled Image         RO   ``UniformConstant`` ``1D``      2       0    0    1     ``Unknown``
														
 
															+``Texture2D``           Sampled Image         RO   ``UniformConstant`` ``2D``      2       0    0    1     ``Unknown``
														
 
															+``Texture3D``           Sampled Image         RO   ``UniformConstant`` ``3D``      2       0    0    1     ``Unknown``
														
 
															+``TextureCube``         Sampled Image         RO   ``UniformConstant`` ``Cube``    2       0    0    1     ``Unknown``
														
 
															+``Texture1DArray``      Sampled Image         RO   ``UniformConstant`` ``1D``      2       1    0    1     ``Unknown``
														
 
															+``Texture2DArray``      Sampled Image         RO   ``UniformConstant`` ``2D``      2       1    0    1     ``Unknown``
														
 
															+``Texture2DMS``         Sampled Image         RO   ``UniformConstant`` ``2D``      2       0    1    1     ``Unknown``
														
 
															+``Texture2DMSArray``    Sampled Image         RO   ``UniformConstant`` ``2D``      2       1    1    1     ``Unknown``      ``ImageMSArray``
														
 
															+``TextureCubeArray``    Sampled Image         RO   ``UniformConstant`` ``3D``      2       1    0    1     ``Unknown``
														
 
															+``Buffer<T>``           Uniform Texel Buffer  RO   ``UniformConstant`` ``Buffer``  2       0    0    1     Depends on ``T`` ``SampledBuffer``
														
 
															+``RWBuffer<T>``         Storage Texel Buffer  RW   ``UniformConstant`` ``Buffer``  2       0    0    2     Depends on ``T`` ``SampledBuffer``
														
 
															+``RWTexture1D<T>``      Storage Image         RW   ``UniformConstant`` ``1D``      2       0    0    2     Depends on ``T``
														
 
															+``RWTexture2D<T>``      Storage Image         RW   ``UniformConstant`` ``2D``      2       0    0    2     Depends on ``T``
														
 
															+``RWTexture3D<T>``      Storage Image         RW   ``UniformConstant`` ``3D``      2       0    0    2     Depends on ``T``
														
 
															+``RWTexture1DArray<T>`` Storage Image         RW   ``UniformConstant`` ``1D``      2       1    0    2     Depends on ``T``
														
 
															+``RWTexture2DArray<T>`` Storage Image         RW   ``UniformConstant`` ``2D``      2       1    0    2     Depends on ``T``
														
 
															 ======================= ==================== ===== =================== ========== ===== ======= == ======= ================ =================
														
 
															 The meanings of the headers in the above table is explained in ``OpTypeImage``
														
@@ -1212,22 +1207,8 @@ flattening all structs if structs are used as function parameters or returns.
 
															 There is an exception to the above rule for SV_Target[N]. It will always be
														
 
															 mapped to ``Location`` number N.
														
 
															-``gl_PerVertex``
														
 
															-~~~~~~~~~~~~~~~~
														
 
															-
														
 
															-Variables annotated with ``SV_Position``, ``SV_ClipDistanceX``, and
														
 
															-``SV_CullDistanceX`` are mapped into fields of a ``gl_PerVertex`` struct:
														
 
															-
														
 
															-.. code:: hlsl
														
 
															-
														
 
															-    struct gl_PerVertex {
														
 
															-        float4 gl_Position;       // SPIR-V BuiltIn Position
														
 
															-        float  gl_PointSize;      // No HLSL equivalent
														
 
															-        float  gl_ClipDistance[]; // SPIR-V BuiltIn ClipDistance
														
 
															-        float  gl_CullDistance[]; // SPIR-V BuiltIn CullDistance
														
 
															-    };
														
 
															-
														
 
															-This mimics how these builtins are handled in GLSL.
														
 
															+``ClipDistance & CullDistance``
														
 
															+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
														
 
															 Variables decorated with ``SV_ClipDistanceX`` can be float or vector of float
														
 
															 type. To map them into one float array in the struct, we firstly sort them
														
@@ -1298,13 +1279,6 @@ If there is no register specification, the corresponding resource will be
 
															 assigned to the next available binding number, starting from 0, in descriptor
														
 
															 set #0.
														
 
															-Error checking
														
 
															-~~~~~~~~~~~~~~
														
 
															-
														
 
															-Trying to reuse the same binding number of the same descriptor set results in
														
 
															-a compiler error, unless we have exactly two resources and one is an image and
														
 
															-the other is a sampler. This is to support the Vulkan combined image sampler.
														
 
															-
														
 
															 Summary
														
 
															 ~~~~~~~
														
@@ -1886,6 +1860,35 @@ HLSL Intrinsic Function   GLSL Extended Instruction
 
															 ``trunc``               ``Trunc``
														
 
															 ======================= ===================================
														
 
															+Synchronization intrinsics
														
 
															+~~~~~~~~~~~~~~~~~~~~~~~~~~
														
 
															+
														
 
															+Synchronization intrinsics are translated into ``OpMemoryBarrier`` (for those
														
 
															+non-``WithGroupSync`` variants) or ``OpControlBarrier`` (for those ``WithGroupSync``
														
 
															+variants) instructions with parameters:
														
 
															+
														
 
															+======================= ============ ===== ======= ========= ==============
														
 
															+       HLSL                SPIR-V          SPIR-V Memory Semantics
														
 
															+----------------------- ------------ --------------------------------------
														
 
															+     Intrinsic          Memory Scope Image Uniform Workgroup AcquireRelease
														
 
															+======================= ============ ===== ======= ========= ==============
														
 
															+``AllMemoryBarrier``    Device       ✓       ✓         ✓          ✓
														
 
															+``DeviceMemoryBarrier`` Device       ✓       ✓                    ✓
														
 
															+``GroupMemoryBarrier``  Workgroup                       ✓          ✓
														
 
															+======================= ============ ===== ======= ========= ==============
														
 
															+
														
 
															+For the ``*WithGroupSync`` intrinsics, SPIR-V memory scope and semantics are the
														
 
															+same as their counterparts in the above. They have an additional execution
														
 
															+scope:
														
 
															+
														
 
															+==================================== ======================
														
 
															+       HLSL Intrinsic                SPIR-V Execution Scope
														
 
															+==================================== ======================
														
 
															+``AllMemoryBarrierWithGroupSync``    Workgroup
														
 
															+``DeviceMemoryBarrierWithGroupSync`` Workgroup
														
 
															+``GroupMemoryBarrierWithGroupSync``  Workgroup
														
 
															+==================================== ======================
														
 
															+
														
 
															 HLSL OO features
														
 
															 ================
														
@@ -2692,9 +2695,6 @@ codegen for Vulkan:
 
															 - ``-fvk-t-shift N M``, similar to ``-fvk-b-shift``, but for t-type registers.
														
 
															 - ``-fvk-s-shift N M``, similar to ``-fvk-b-shift``, but for s-type registers.
														
 
															 - ``-fvk-u-shift N M``, similar to ``-fvk-b-shift``, but for u-type registers.
														
 
															-- ``-fvk-ignore-unused-resources``: Avoids emitting SPIR-V code for resources
														
 
															-  defined but not statically referenced by the call tree of the entry point
														
 
															-  in question.
														
 
															 - ``-fvk-use-gl-layout``: Uses strict OpenGL ``std140``/``std430``
														
 
															   layout rules for resources.
														
 
															 - ``-fvk-use-dx-layout``: Uses DirectX layout rules for resources.
														
@@ -2711,6 +2711,8 @@ codegen for Vulkan:
 
															 - ``-fspv-target-env=<env>``: Specifies the target environment for this compilation.
														
 
															   The current valid options are ``vulkan1.0`` and ``vulkan1.1``. If no target
														
 
															   environment is provided, ``vulkan1.0`` is used as default.
														
 
															+- ``-Wno-vk-ignored-features``: Does not emit warnings on ignored features
														
 
															+  resulting from no Vulkan support, e.g., cbuffer member initializer.
														
 
															 Unsupported HLSL Features
														
 
															 =========================
														
--- a/external/GTestConfig.cmake
+++ b/external/GTestConfig.cmake
@@ -21,9 +21,6 @@ include_directories(
 
															 if(WIN32)
														
 
															   add_definitions(-DGTEST_OS_WINDOWS=1)
														
 
															-  # GoogleTest uses std::tr1, which is deprecated in VS2017.
														
 
															-  # The following is an escape-hatch macro to silence the deprecation warnings.
														
 
															-  add_definitions(-D_SILENCE_TR1_NAMESPACE_DEPRECATION_WARNING)
														
 
															 endif()
														
 
															 if(SUPPORTS_VARIADIC_MACROS_FLAG)
														
--- a/external/SPIRV-Headers
+++ b/external/SPIRV-Headers
@@ -1 +1 @@
 
															-Subproject commit 3a4dbdde9a9b2cf23736694ba70262dce27fbeaa
														
 
															+Subproject commit 3ce3e49d73b8abbf2ffe33f829f941fb2a40f552
														
--- a/external/SPIRV-Tools
+++ b/external/SPIRV-Tools
@@ -1 +1 @@
 
															-Subproject commit 42840d15e4bf5cba4a7345639b409c6e962b96c2
														
 
															+Subproject commit b09e3ce8427c7cfffcc4950f5bd05fa4c586b23c
														
--- a/external/googletest
+++ b/external/googletest
@@ -1 +1 @@
 
															-Subproject commit 82febb8eafc0425601b0d46567dc66c7750233ff
														
 
															+Subproject commit 08d5b1f33af8c18785fb8ca02792b5fac81e248f
														
--- a/external/re2
+++ b/external/re2
@@ -1 +1 @@
 
															-Subproject commit f2cc1aeb5de463c45d020c446cbcb028385b49f3
														
 
															+Subproject commit 1c7eb5604bc46c0198fc7bc35b32985ffe57ca93
														
--- a/include/dxc/HLSL/DxilConstants.h
+++ b/include/dxc/HLSL/DxilConstants.h
@@ -1053,22 +1053,12 @@ namespace DXIL {
 
															   };
														
 
															-  // TODO: revisit data layout descriptions for the following:
														
 
															-  //      - x64 pointers?
														
 
															-  //      - Keep elf manging(m:e)?
														
 
															-
														
 
															-  // For legacy data layout, everything less than 32 align to 32.
														
 
															-  static const char* kLegacyLayoutString = "e-m:e-p:32:32-i1:32-i8:32-i16:32-i32:32-i64:64-f16:32-f32:32-f:64:64-n8:16:32:64";
														
 
															-
														
 
															-  // New data layout with native low precision types
														
 
															-  static const char* kNewLayoutString = "e-m:e-p:32:32-i1:32-i8:8-i16:16-i32:32-i64:64-f16:16-f32:32-f64:64-n8:16:32:64";
														
 
															-
														
 
															-  // Function Attributes
														
 
															-  // TODO: consider generating attributes from hctdb
														
 
															-  static const char* kFP32DenormKindString          = "fp32-denorm-mode";
														
 
															-  static const char* kFP32DenormValueAnyString      = "any";
														
 
															-  static const char* kFP32DenormValuePreserveString = "preserve";
														
 
															-  static const char* kFP32DenormValueFtzString      = "ftz";
														
 
															+  extern const char* kLegacyLayoutString;
														
 
															+  extern const char* kNewLayoutString;
														
 
															+  extern const char* kFP32DenormKindString;
														
 
															+  extern const char* kFP32DenormValueAnyString;
														
 
															+  extern const char* kFP32DenormValuePreserveString;
														
 
															+  extern const char* kFP32DenormValueFtzString;
														
 
															 } // namespace DXIL
														
--- a/include/dxc/HLSL/DxilMetadataHelper.h
+++ b/include/dxc/HLSL/DxilMetadataHelper.h
@@ -81,6 +81,12 @@ public:
 
															   // ViewId state.
														
 
															   static const char kDxilViewIdStateMDName[];
														
 
															+  // Source info.
														
 
															+  static const char kDxilSourceContentsMDName[];
														
 
															+  static const char kDxilSourceDefinesMDName[];
														
 
															+  static const char kDxilSourceMainFileNameMDName[];
														
 
															+  static const char kDxilSourceArgsMDName[];
														
 
															+
														
 
															   // Function props.
														
 
															   static const char kDxilFunctionPropertiesMDName[];
														
 
															   static const char kDxilEntrySignaturesMDName[];
														
--- a/include/dxc/HLSL/DxilPipelineStateValidation.h
+++ b/include/dxc/HLSL/DxilPipelineStateValidation.h
@@ -25,34 +25,40 @@ inline uint32_t PSVComputeInputOutputTableSize(uint32_t InputVectors, uint32_t O
 
															 #define PSVALIGN(ptr, alignbits) (((ptr) + ((1 << (alignbits))-1)) & ~((1 << (alignbits))-1))
														
 
															 #define PSVALIGN4(ptr) (((ptr) + 3) & ~3)
														
 
															+struct VSInfo {
														
 
															+  char OutputPositionPresent;
														
 
															+};
														
 
															+struct HSInfo {
														
 
															+  uint32_t InputControlPointCount;      // max control points == 32
														
 
															+  uint32_t OutputControlPointCount;     // max control points == 32
														
 
															+  uint32_t TessellatorDomain;           // hlsl::DXIL::TessellatorDomain/D3D11_SB_TESSELLATOR_DOMAIN
														
 
															+  uint32_t TessellatorOutputPrimitive;  // hlsl::DXIL::TessellatorOutputPrimitive/D3D11_SB_TESSELLATOR_OUTPUT_PRIMITIVE
														
 
															+};
														
 
															+struct DSInfo {
														
 
															+  uint32_t InputControlPointCount;      // max control points == 32
														
 
															+  char OutputPositionPresent;
														
 
															+  uint32_t TessellatorDomain;           // hlsl::DXIL::TessellatorDomain/D3D11_SB_TESSELLATOR_DOMAIN
														
 
															+};
														
 
															+struct GSInfo {
														
 
															+  uint32_t InputPrimitive;              // hlsl::DXIL::InputPrimitive/D3D10_SB_PRIMITIVE
														
 
															+  uint32_t OutputTopology;              // hlsl::DXIL::PrimitiveTopology/D3D10_SB_PRIMITIVE_TOPOLOGY
														
 
															+  uint32_t OutputStreamMask;            // max streams == 4
														
 
															+  char OutputPositionPresent;
														
 
															+};
														
 
															+struct PSInfo {
														
 
															+  char DepthOutput;
														
 
															+  char SampleFrequency;
														
 
															+};
														
 
															+
														
 
															 // Versioning is additive and based on size
														
 
															 struct PSVRuntimeInfo0
														
 
															 {
														
 
															   union {
														
 
															-    struct VSInfo {
														
 
															-      char OutputPositionPresent;
														
 
															-    } VS;
														
 
															-    struct HSInfo {
														
 
															-      uint32_t InputControlPointCount;      // max control points == 32
														
 
															-      uint32_t OutputControlPointCount;     // max control points == 32
														
 
															-      uint32_t TessellatorDomain;           // hlsl::DXIL::TessellatorDomain/D3D11_SB_TESSELLATOR_DOMAIN
														
 
															-      uint32_t TessellatorOutputPrimitive;  // hlsl::DXIL::TessellatorOutputPrimitive/D3D11_SB_TESSELLATOR_OUTPUT_PRIMITIVE
														
 
															-    } HS;
														
 
															-    struct DSInfo {
														
 
															-      uint32_t InputControlPointCount;      // max control points == 32
														
 
															-      char OutputPositionPresent;
														
 
															-      uint32_t TessellatorDomain;           // hlsl::DXIL::TessellatorDomain/D3D11_SB_TESSELLATOR_DOMAIN
														
 
															-    } DS;
														
 
															-    struct GSInfo {
														
 
															-      uint32_t InputPrimitive;              // hlsl::DXIL::InputPrimitive/D3D10_SB_PRIMITIVE
														
 
															-      uint32_t OutputTopology;              // hlsl::DXIL::PrimitiveTopology/D3D10_SB_PRIMITIVE_TOPOLOGY
														
 
															-      uint32_t OutputStreamMask;            // max streams == 4
														
 
															-      char OutputPositionPresent;
														
 
															-    } GS;
														
 
															-    struct PSInfo {
														
 
															-      char DepthOutput;
														
 
															-      char SampleFrequency;
														
 
															-    } PS;
														
 
															+    VSInfo VS;
														
 
															+    HSInfo HS;
														
 
															+    DSInfo DS;
														
 
															+    GSInfo GS;
														
 
															+    PSInfo PS;
														
 
															   };
														
 
															   uint32_t MinimumExpectedWaveLaneCount;  // minimum lane count required, 0 if unused
														
 
															   uint32_t MaximumExpectedWaveLaneCount;  // maximum lane count required, 0xffffffff if unused
														
@@ -228,7 +234,7 @@ struct PSVSemanticIndexes {
 
															   uint32_t Offset;
														
 
															   PSVSemanticIndexes() : Offset(0) {}
														
 
															   PSVSemanticIndexes(uint32_t offset) : Offset(offset) {}
														
 
															-  uint32_t *Get(const PSVSemanticIndexTable &table) const { table.Get(Offset); }
														
 
															+  const uint32_t *Get(const PSVSemanticIndexTable &table) const { return table.Get(Offset); }
														
 
															 };
														
 
															 enum class PSVSemanticKind : uint8_t    // DXIL::SemanticKind
														
--- a/include/dxc/HLSL/DxilSigPoint.inl
+++ b/include/dxc/HLSL/DxilSigPoint.inl
@@ -49,37 +49,37 @@ const SigPoint SigPoint::ms_SigPoints[kNumSigPointRecords] = {
 
															 // <py::lines('INTERPRETATION-TABLE')>hctdb_instrhelp.get_interpretation_table()</py>
														
 
															 // INTERPRETATION-TABLE:BEGIN
														
 
															-//   Semantic,               VSIn,         VSOut, PCIn,         HSIn,         HSCPIn, HSCPOut, PCOut,      DSIn,         DSCPIn, DSOut, GSVIn, GSIn,         GSOut, PSIn,          PSOut,         CSIn
														
 
															-#define DO_INTERPRETATION_TABLE(DO) \
														
 
															-  DO(Arbitrary,              Arb,          Arb,   NA,           NA,           Arb,    Arb,     Arb,        Arb,          Arb,    Arb,   Arb,   NA,           Arb,   Arb,           NA,            NA) \
														
 
															-  DO(VertexID,               SV,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NA) \
														
 
															-  DO(InstanceID,             SV,           Arb,   NA,           NA,           Arb,    Arb,     NA,         NA,           Arb,    Arb,   Arb,   NA,           Arb,   Arb,           NA,            NA) \
														
 
															-  DO(Position,               Arb,          SV,    NA,           NA,           SV,     SV,      Arb,        Arb,          SV,     SV,    SV,    NA,           SV,    SV,            NA,            NA) \
														
 
															-  DO(RenderTargetArrayIndex, Arb,          SV,    NA,           NA,           SV,     SV,      Arb,        Arb,          SV,     SV,    SV,    NA,           SV,    SV,            NA,            NA) \
														
 
															-  DO(ViewPortArrayIndex,     Arb,          SV,    NA,           NA,           SV,     SV,      Arb,        Arb,          SV,     SV,    SV,    NA,           SV,    SV,            NA,            NA) \
														
 
															-  DO(ClipDistance,           Arb,          SV,    NA,           NA,           SV,     SV,      Arb,        Arb,          SV,     SV,    SV,    NA,           SV,    SV,            NA,            NA) \
														
 
															-  DO(CullDistance,           Arb,          SV,    NA,           NA,           SV,     SV,      Arb,        Arb,          SV,     SV,    SV,    NA,           SV,    SV,            NA,            NA) \
														
 
															-  DO(OutputControlPointID,   NA,           NA,    NA,           NotInSig,     NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NA) \
														
 
															-  DO(DomainLocation,         NA,           NA,    NA,           NA,           NA,     NA,      NA,         NotInSig,     NA,     NA,    NA,    NA,           NA,    NA,            NA,            NA) \
														
 
															-  DO(PrimitiveID,            NA,           NA,    NotInSig,     NotInSig,     NA,     NA,      NA,         NotInSig,     NA,     NA,    NA,    Shadow,       SGV,   SGV,           NA,            NA) \
														
 
															-  DO(GSInstanceID,           NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NotInSig,     NA,    NA,            NA,            NA) \
														
 
															-  DO(SampleIndex,            NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    Shadow _41,    NA,            NA) \
														
 
															-  DO(IsFrontFace,            NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           SGV,   SGV,           NA,            NA) \
														
 
															-  DO(Coverage,               NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NotInSig _50,  NotPacked _41, NA) \
														
 
															-  DO(InnerCoverage,          NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NotInSig _50,  NA,            NA) \
														
 
															-  DO(Target,                 NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            Target,        NA) \
														
 
															-  DO(Depth,                  NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NotPacked,     NA) \
														
 
															-  DO(DepthLessEqual,         NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NotPacked _50, NA) \
														
 
															-  DO(DepthGreaterEqual,      NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NotPacked _50, NA) \
														
 
															-  DO(StencilRef,             NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NotPacked _50, NA) \
														
 
															-  DO(DispatchThreadID,       NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NotInSig) \
														
 
															-  DO(GroupID,                NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NotInSig) \
														
 
															-  DO(GroupIndex,             NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NotInSig) \
														
 
															-  DO(GroupThreadID,          NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NA,            NA,            NotInSig) \
														
 
															-  DO(TessFactor,             NA,           NA,    NA,           NA,           NA,     NA,      TessFactor, TessFactor,   NA,     NA,    NA,    NA,           NA,    NA,            NA,            NA) \
														
 
															-  DO(InsideTessFactor,       NA,           NA,    NA,           NA,           NA,     NA,      TessFactor, TessFactor,   NA,     NA,    NA,    NA,           NA,    NA,            NA,            NA) \
														
 
															-  DO(ViewID,                 NotInSig _61, NA,    NotInSig _61, NotInSig _61, NA,     NA,      NA,         NotInSig _61, NA,     NA,    NA,    NotInSig _61, NA,    NotInSig _61,  NA,            NA) \
														
 
															-  DO(Barycentrics,           NA,           NA,    NA,           NA,           NA,     NA,      NA,         NA,           NA,     NA,    NA,    NA,           NA,    NotPacked _61, NA,            NA)
														
 
															+//  Semantic            VSIn,           VSOut,  PCIn,            HSIn,            HSCPIn, HSCPOut, PCOut,         DSIn,            DSCPIn, DSOut,  GSVIn,  GSIn,            GSOut,  PSIn,             PSOut,            CSIn
														
 
															+#define DO_INTERPRETATION_TABLE(D) \
														
 
															+  {/*Arbitrary*/        D(Arb),         D(Arb), D(NA),           D(NA),           D(Arb), D(Arb),  D(Arb),        D(Arb),          D(Arb), D(Arb), D(Arb), D(NA),           D(Arb), D(Arb),           D(NA),            D(NA)}, \
														
 
															+  {/*VertexID*/         D(SV),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*InstanceID*/       D(SV),          D(Arb), D(NA),           D(NA),           D(Arb), D(Arb),  D(NA),         D(NA),           D(Arb), D(Arb), D(Arb), D(NA),           D(Arb), D(Arb),           D(NA),            D(NA)}, \
														
 
															+  {/*Position*/         D(Arb),         D(SV),  D(NA),           D(NA),           D(SV),  D(SV),   D(Arb),        D(Arb),          D(SV),  D(SV),  D(SV),  D(NA),           D(SV),  D(SV),            D(NA),            D(NA)}, \
														
 
															+  {/*RenderTgArrayIdx*/ D(Arb),         D(SV),  D(NA),           D(NA),           D(SV),  D(SV),   D(Arb),        D(Arb),          D(SV),  D(SV),  D(SV),  D(NA),           D(SV),  D(SV),            D(NA),            D(NA)}, \
														
 
															+  {/*ViewPortArrayIdx*/ D(Arb),         D(SV),  D(NA),           D(NA),           D(SV),  D(SV),   D(Arb),        D(Arb),          D(SV),  D(SV),  D(SV),  D(NA),           D(SV),  D(SV),            D(NA),            D(NA)}, \
														
 
															+  {/*ClipDistance*/     D(Arb),         D(SV),  D(NA),           D(NA),           D(SV),  D(SV),   D(Arb),        D(Arb),          D(SV),  D(SV),  D(SV),  D(NA),           D(SV),  D(SV),            D(NA),            D(NA)}, \
														
 
															+  {/*CullDistance*/     D(Arb),         D(SV),  D(NA),           D(NA),           D(SV),  D(SV),   D(Arb),        D(Arb),          D(SV),  D(SV),  D(SV),  D(NA),           D(SV),  D(SV),            D(NA),            D(NA)}, \
														
 
															+  {/*OutputControlPtID*/D(NA),          D(NA),  D(NA),           D(NotInSig),     D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*DomainLocation*/   D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NotInSig),     D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*PrimitiveID*/      D(NA),          D(NA),  D(NotInSig),     D(NotInSig),     D(NA),  D(NA),   D(NA),         D(NotInSig),     D(NA),  D(NA),  D(NA),  D(Shadow),       D(SGV), D(SGV),           D(NA),            D(NA)}, \
														
 
															+  {/*GSInstanceID*/     D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NotInSig),     D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*SampleIndex*/      D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(Shadow _41),    D(NA),            D(NA)}, \
														
 
															+  {/*IsFrontFace*/      D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(SGV), D(SGV),           D(NA),            D(NA)}, \
														
 
															+  {/*Coverage*/         D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NotInSig _50),  D(NotPacked _41), D(NA)}, \
														
 
															+  {/*InnerCoverage*/    D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NotInSig _50),  D(NA),            D(NA)}, \
														
 
															+  {/*Target*/           D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(Target),        D(NA)}, \
														
 
															+  {/*Depth*/            D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NotPacked),     D(NA)}, \
														
 
															+  {/*DepthLessEqual*/   D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NotPacked _50), D(NA)}, \
														
 
															+  {/*DepthGreaterEqual*/D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NotPacked _50), D(NA)}, \
														
 
															+  {/*StencilRef*/       D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NotPacked _50), D(NA)}, \
														
 
															+  {/*DispatchThreadID*/ D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NotInSig)}, \
														
 
															+  {/*GroupID*/          D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NotInSig)}, \
														
 
															+  {/*GroupIndex*/       D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NotInSig)}, \
														
 
															+  {/*GroupThreadID*/    D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NotInSig)}, \
														
 
															+  {/*TessFactor*/       D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(TessFactor), D(TessFactor),   D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*InsideTessFactor*/ D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(TessFactor), D(TessFactor),   D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NA),            D(NA),            D(NA)}, \
														
 
															+  {/*ViewID*/           D(NotInSig _61),D(NA),  D(NotInSig _61), D(NotInSig _61), D(NA),  D(NA),   D(NA),         D(NotInSig _61), D(NA),  D(NA),  D(NA),  D(NotInSig _61), D(NA),  D(NotInSig _61),  D(NA),            D(NA)}, \
														
 
															+  {/*Barycentrics*/     D(NA),          D(NA),  D(NA),           D(NA),           D(NA),  D(NA),   D(NA),         D(NA),           D(NA),  D(NA),  D(NA),  D(NA),           D(NA),  D(NotPacked _61), D(NA),            D(NA)}, \
														
 
															 // INTERPRETATION-TABLE:END
														
 
															 const VersionedSemanticInterpretation SigPoint::ms_SemanticInterpretationTable[(unsigned)DXIL::SemanticKind::Invalid][(unsigned)SigPoint::Kind::Invalid] = {
														
@@ -87,10 +87,7 @@ const VersionedSemanticInterpretation SigPoint::ms_SemanticInterpretationTable[(
 
															 #define _50 ,5,0
														
 
															 #define _61 ,6,1
														
 
															 #define DO(k) VersionedSemanticInterpretation(DXIL::SemanticInterpretationKind::k)
														
 
															-#define DO_ROW(SEM, VSIn, VSOut, PCIn, HSIn, HSCPIn, HSCPOut, PCOut, DSIn, DSCPIn, DSOut, GSVIn, GSIn, GSOut, PSIn, PSOut, CSIn) \
														
 
															-  { DO(VSIn), DO(VSOut), DO(PCIn), DO(HSIn), DO(HSCPIn), DO(HSCPOut), DO(PCOut), DO(DSIn), DO(DSCPIn), DO(DSOut), DO(GSVIn), DO(GSIn), DO(GSOut), DO(PSIn), DO(PSOut), DO(CSIn) },
														
 
															-  DO_INTERPRETATION_TABLE(DO_ROW)
														
 
															-#undef DO_ROW
														
 
															+  DO_INTERPRETATION_TABLE(DO)
														
 
															 #undef DO
														
 
															 };
														
--- a/include/dxc/HLSL/DxilSignatureAllocator.h
+++ b/include/dxc/HLSL/DxilSignatureAllocator.h
@@ -54,20 +54,20 @@ public:
 
															       dataBitWidth(DXIL::SignatureDataWidth::Undefined),
														
 
															       indexFlags(0)
														
 
															     {}
														
 
															-    __override ~DummyElement() {}
														
 
															-    __override uint32_t GetID() const { return id; }
														
 
															-    __override DXIL::SemanticKind GetKind() const { return kind; }
														
 
															-    __override DXIL::InterpolationMode GetInterpolationMode() const { return interpolation; }
														
 
															-    __override DXIL::SemanticInterpretationKind GetInterpretation() const { return interpretation; }
														
 
															-    __override DXIL::SignatureDataWidth GetDataBitWidth() const { return dataBitWidth; }
														
 
															-    __override uint32_t GetRows() const { return rows; }
														
 
															-    __override uint32_t GetCols() const { return cols; }
														
 
															-    __override bool IsAllocated() const { return row != (uint32_t)-1; }
														
 
															-    __override uint32_t GetStartRow() const { return row; }
														
 
															-    __override uint32_t GetStartCol() const { return col; }
														
 
															-
														
 
															-    __override void ClearLocation() { row = col = (uint32_t)-1; }
														
 
															-    __override void SetLocation(uint32_t Row, uint32_t Col) { row = Row; col = Col; }
														
 
															+    ~DummyElement() override {}
														
 
															+    uint32_t GetID() const override { return id; }
														
 
															+    DXIL::SemanticKind GetKind() const override { return kind; }
														
 
															+    DXIL::InterpolationMode GetInterpolationMode() const override { return interpolation; }
														
 
															+    DXIL::SemanticInterpretationKind GetInterpretation() const override { return interpretation; }
														
 
															+    DXIL::SignatureDataWidth GetDataBitWidth() const override { return dataBitWidth; }
														
 
															+    uint32_t GetRows() const override { return rows; }
														
 
															+    uint32_t GetCols() const override { return cols; }
														
 
															+    bool IsAllocated() const override { return row != (uint32_t)-1; }
														
 
															+    uint32_t GetStartRow() const override { return row; }
														
 
															+    uint32_t GetStartCol() const override { return col; }
														
 
															+
														
 
															+    void ClearLocation() override { row = col = (uint32_t)-1; }
														
 
															+    void SetLocation(uint32_t Row, uint32_t Col) override { row = Row; col = Col; }
														
 
															   };
														
 
															   // index flags
														
--- a/include/dxc/HLSL/DxilSignatureElement.h
+++ b/include/dxc/HLSL/DxilSignatureElement.h
@@ -114,12 +114,12 @@ class DxilPackElement : public DxilSignatureAllocator::PackElement {
 
															 public:
														
 
															   DxilPackElement(DxilSignatureElement *pSE, bool useMinPrecision) : m_pSE(pSE), m_bUseMinPrecision(useMinPrecision) {}
														
 
															-  __override ~DxilPackElement() {}
														
 
															-  __override uint32_t GetID() const { return m_pSE->GetID(); }
														
 
															-  __override DXIL::SemanticKind GetKind() const { return m_pSE->GetKind(); }
														
 
															-  __override DXIL::InterpolationMode GetInterpolationMode() const { return m_pSE->GetInterpolationMode()->GetKind(); }
														
 
															-  __override DXIL::SemanticInterpretationKind GetInterpretation() const { return m_pSE->GetInterpretation(); }
														
 
															-  __override DXIL::SignatureDataWidth GetDataBitWidth() const {
														
 
															+  ~DxilPackElement() override {}
														
 
															+  uint32_t GetID() const override { return m_pSE->GetID(); }
														
 
															+  DXIL::SemanticKind GetKind() const override { return m_pSE->GetKind(); }
														
 
															+  DXIL::InterpolationMode GetInterpolationMode() const override { return m_pSE->GetInterpolationMode()->GetKind(); }
														
 
															+  DXIL::SemanticInterpretationKind GetInterpretation() const override { return m_pSE->GetInterpretation(); }
														
 
															+  DXIL::SignatureDataWidth GetDataBitWidth() const override {
														
 
															     uint8_t size = m_pSE->GetCompType().GetSizeInBits();
														
 
															     // bool, min precision, or 32 bit types map to 32 bit size.
														
 
															     if (size == 16) {
														
@@ -130,17 +130,17 @@ public:
 
															     }
														
 
															     return DXIL::SignatureDataWidth::Undefined;
														
 
															   }
														
 
															-  __override uint32_t GetRows() const { return m_pSE->GetRows(); }
														
 
															-  __override uint32_t GetCols() const { return m_pSE->GetCols(); }
														
 
															-  __override bool IsAllocated() const { return m_pSE->IsAllocated(); }
														
 
															-  __override uint32_t GetStartRow() const { return m_pSE->GetStartRow(); }
														
 
															-  __override uint32_t GetStartCol() const { return m_pSE->GetStartCol(); }
														
 
															+  uint32_t GetRows() const override { return m_pSE->GetRows(); }
														
 
															+  uint32_t GetCols() const override { return m_pSE->GetCols(); }
														
 
															+  bool IsAllocated() const override { return m_pSE->IsAllocated(); }
														
 
															+  uint32_t GetStartRow() const override { return m_pSE->GetStartRow(); }
														
 
															+  uint32_t GetStartCol() const override { return m_pSE->GetStartCol(); }
														
 
															-  __override void ClearLocation() {
														
 
															+  void ClearLocation() override {
														
 
															     m_pSE->SetStartRow(-1);
														
 
															     m_pSE->SetStartCol(-1);
														
 
															   }
														
 
															-  __override void SetLocation(uint32_t Row, uint32_t Col) {
														
 
															+  void SetLocation(uint32_t Row, uint32_t Col) override {
														
 
															     m_pSE->SetStartRow(Row);
														
 
															     m_pSE->SetStartCol(Col);
														
 
															   }
														
--- a/include/dxc/HLSL/DxilSpanAllocator.h
+++ b/include/dxc/HLSL/DxilSpanAllocator.h
@@ -58,7 +58,7 @@ public:
 
															     auto next = m_Spans.lower_bound(Span(nullptr, pos, end));
														
 
															     if (next == m_Spans.end() || end < next->start)
														
 
															       return true;  // it fits here
														
 
															-    return Find(size, result.first, pos, align);
														
 
															+    return Find(size, next, pos, align);
														
 
															   }
														
 
															   // allocate element size in first available space, returns false on failure
														
--- a/include/dxc/HLSL/ViewIDPipelineValidation.inl
+++ b/include/dxc/HLSL/ViewIDPipelineValidation.inl
@@ -238,10 +238,10 @@ public:
 
															       m_GSRastStreamIndex(gsRastStreamIndex)
														
 
															   {}
														
 
															   virtual ~ViewIDValidator_impl() {}
														
 
															-  __override Result ValidateStage(const DxilPipelineStateValidation &PSV,
														
 
															-                                  bool bFinalStage,
														
 
															-                                  bool bExpandInputOnly,
														
 
															-                                  unsigned &mismatchElementId) {
														
 
															+  Result ValidateStage(const DxilPipelineStateValidation &PSV,
														
 
															+                       bool bFinalStage,
														
 
															+                       bool bExpandInputOnly,
														
 
															+                       unsigned &mismatchElementId) override {
														
 
															     if (!PSV.GetPSVRuntimeInfo0())
														
 
															       return Result::InvalidPSV;
														
 
															     if (!PSV.GetPSVRuntimeInfo1())
														
--- a/include/dxc/Support/DxcLangExtensionsHelper.h
+++ b/include/dxc/Support/DxcLangExtensionsHelper.h
@@ -192,7 +192,7 @@ public:
 
															     return SemanticDefineValidationResult{ warning, error };
														
 
															   }
														
 
															-  __override void SetupSema(clang::Sema &S) {
														
 
															+  void SetupSema(clang::Sema &S) override {
														
 
															     clang::ExternalASTSource *astSource = S.getASTContext().getExternalSource();
														
 
															     if (clang::ExternalSemaSource *externalSema =
														
 
															             llvm::dyn_cast_or_null<clang::ExternalSemaSource>(astSource)) {
														
@@ -202,13 +202,13 @@ public:
 
															     }
														
 
															   }
														
 
															-  __override void SetupPreprocessorOptions(clang::PreprocessorOptions &PPOpts) {
														
 
															+  void SetupPreprocessorOptions(clang::PreprocessorOptions &PPOpts) override {
														
 
															     for (const auto & define : m_defines) {
														
 
															       PPOpts.addMacroDef(llvm::StringRef(define.c_str()));
														
 
															     }
														
 
															   }
														
 
															-  __override DxcLangExtensionsHelper *GetDxcLangExtensionsHelper() {
														
 
															+  DxcLangExtensionsHelper *GetDxcLangExtensionsHelper() override {
														
 
															     return this;
														
 
															   }
														
@@ -220,27 +220,27 @@ public:
 
															 // Use this macro to embed an implementation that will delegate to a field.
														
 
															 // Note that QueryInterface still needs to return the vtable.
														
 
															 #define DXC_LANGEXTENSIONS_HELPER_IMPL(_helper_field_) \
														
 
															-  __override HRESULT STDMETHODCALLTYPE RegisterIntrinsicTable(_In_ IDxcIntrinsicTable *pTable) { \
														
 
															+  HRESULT STDMETHODCALLTYPE RegisterIntrinsicTable(_In_ IDxcIntrinsicTable *pTable) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).RegisterIntrinsicTable(pTable); \
														
 
															   } \
														
 
															-  __override HRESULT STDMETHODCALLTYPE RegisterSemanticDefine(LPCWSTR name) { \
														
 
															+  HRESULT STDMETHODCALLTYPE RegisterSemanticDefine(LPCWSTR name) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).RegisterSemanticDefine(name); \
														
 
															   } \
														
 
															-  __override HRESULT STDMETHODCALLTYPE RegisterSemanticDefineExclusion(LPCWSTR name) { \
														
 
															+  HRESULT STDMETHODCALLTYPE RegisterSemanticDefineExclusion(LPCWSTR name) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).RegisterSemanticDefineExclusion(name); \
														
 
															   } \
														
 
															-  __override HRESULT STDMETHODCALLTYPE RegisterDefine(LPCWSTR name) { \
														
 
															+  HRESULT STDMETHODCALLTYPE RegisterDefine(LPCWSTR name) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).RegisterDefine(name); \
														
 
															   } \
														
 
															-  __override HRESULT STDMETHODCALLTYPE SetSemanticDefineValidator(_In_ IDxcSemanticDefineValidator* pValidator) { \
														
 
															+  HRESULT STDMETHODCALLTYPE SetSemanticDefineValidator(_In_ IDxcSemanticDefineValidator* pValidator) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).SetSemanticDefineValidator(pValidator); \
														
 
															   } \
														
 
															-  __override HRESULT STDMETHODCALLTYPE SetSemanticDefineMetaDataName(LPCSTR name) { \
														
 
															+  HRESULT STDMETHODCALLTYPE SetSemanticDefineMetaDataName(LPCSTR name) override { \
														
 
															     DxcThreadMalloc TM(m_pMalloc); \
														
 
															     return (_helper_field_).SetSemanticDefineMetaDataName(name); \
														
 
															   } \
														
--- a/include/dxc/Support/FileIOHelper.h
+++ b/include/dxc/Support/FileIOHelper.h
@@ -53,7 +53,7 @@ public:
 
															   }
														
 
															   explicit CDxcTMHeapPtr(_In_ T* pData) throw() :
														
 
															-    CDxcTMHeapPtr<T, CDxcThreadMallocAllocator>(pData)
														
 
															+    CHeapPtr<T, CDxcThreadMallocAllocator>(pData)
														
 
															   {
														
 
															   }
														
 
															 };
														
--- a/include/dxc/Support/HLSLOptions.h
+++ b/include/dxc/Support/HLSLOptions.h
@@ -162,11 +162,11 @@ public:
 
															   // SPIRV Change Starts
														
 
															 #ifdef ENABLE_SPIRV_CODEGEN
														
 
															   bool GenSPIRV;                           // OPT_spirv
														
 
															-  bool VkIgnoreUnusedResources;            // OPT_fvk_ignore_used_resources
														
 
															   bool VkInvertY;                          // OPT_fvk_invert_y
														
 
															   bool VkUseGlLayout;                      // OPT_fvk_use_gl_layout
														
 
															   bool VkUseDxLayout;                      // OPT_fvk_use_dx_layout
														
 
															   bool SpvEnableReflect;                   // OPT_fspv_reflect
														
 
															+  bool VkNoWarnIgnoredFeatures;            // OPT_Wno_vk_ignored_features
														
 
															   llvm::StringRef VkStageIoOrder;          // OPT_fvk_stage_io_order
														
 
															   llvm::SmallVector<int32_t, 4> VkBShift;  // OPT_fvk_b_shift
														
 
															   llvm::SmallVector<int32_t, 4> VkTShift;  // OPT_fvk_t_shift
														
--- a/include/dxc/Support/HLSLOptions.td
+++ b/include/dxc/Support/HLSLOptions.td
@@ -237,8 +237,6 @@ def auto_binding_space : Separate<["-", "/"], "auto-binding-space">, Group<hlslc
 
															 // SPIRV Change Starts
														
 
															 def spirv : Flag<["-"], "spirv">, Group<spirv_Group>, Flags<[CoreOption, DriverOption]>,
														
 
															   HelpText<"Generate SPIR-V code">;
														
 
															-def fvk_ignore_unused_resources : Flag<["-"], "fvk-ignore-unused-resources">, Group<spirv_Group>, Flags<[CoreOption, DriverOption]>,
														
 
															-  HelpText<"Do not emit SPIR-V code for unused resources">;
														
 
															 def fvk_stage_io_order_EQ : Joined<["-"], "fvk-stage-io-order=">, Group<spirv_Group>, Flags<[CoreOption, DriverOption, HelpHidden]>,
														
 
															   HelpText<"Specify Vulkan stage I/O location assignment order">;
														
 
															 def fvk_b_shift : MultiArg<["-"], "fvk-b-shift", 2>, MetaVarName<"<shift> <space>">, Group<spirv_Group>, Flags<[CoreOption, DriverOption]>,
														
@@ -261,6 +259,8 @@ def fspv_extension_EQ : Joined<["-"], "fspv-extension=">, Group<spirv_Group>, Fl
 
															   HelpText<"Specify SPIR-V extension permitted to use">;
														
 
															 def fspv_target_env_EQ : Joined<["-"], "fspv-target-env=">, Group<spirv_Group>, Flags<[CoreOption, DriverOption]>,
														
 
															   HelpText<"Specify the target environment: vulkan1.0 (default) or vulkan1.1">;
														
 
															+def Wno_vk_ignored_features : Joined<["-"], "Wno-vk-ignored-features">, Group<spirv_Group>, Flags<[CoreOption, DriverOption, HelpHidden]>,
														
 
															+  HelpText<"Do not emit warnings for ingored features resulting from no Vulkan support">;
														
 
															 // SPIRV Change Ends
														
 
															 //////////////////////////////////////////////////////////////////////////////
														
--- a/include/dxc/Support/dxcapi.impl.h
+++ b/include/dxc/Support/dxcapi.impl.h
@@ -97,7 +97,7 @@ public:
 
															     return CreateFromResultErrorStatus(resultBlob, errorBlob, status, pResult);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetStatus(_Out_ HRESULT *pStatus) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetStatus(_Out_ HRESULT *pStatus) override {
														
 
															     if (pStatus == nullptr)
														
 
															       return E_INVALIDARG;
														
@@ -105,13 +105,13 @@ public:
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE
														
 
															-    GetResult(_COM_Outptr_result_maybenull_ IDxcBlob **ppResult) {
														
 
															+  HRESULT STDMETHODCALLTYPE
														
 
															+    GetResult(_COM_Outptr_result_maybenull_ IDxcBlob **ppResult) override {
														
 
															     return m_result.CopyTo(ppResult);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE
														
 
															-    GetErrorBuffer(_COM_Outptr_result_maybenull_ IDxcBlobEncoding **ppErrors) {
														
 
															+  HRESULT STDMETHODCALLTYPE
														
 
															+    GetErrorBuffer(_COM_Outptr_result_maybenull_ IDxcBlobEncoding **ppErrors) override {
														
 
															     return m_errors.CopyTo(ppErrors);
														
 
															   }
														
 
															 };
														
--- a/include/dxc/Support/microcom.h
+++ b/include/dxc/Support/microcom.h
@@ -139,21 +139,6 @@ void DxcCallDestructor(T *obj) {
 
															 /// marshaling. This will help catch marshaling problems early or avoid
														
 
															 /// them altogether.
														
 
															 /// </remarks>
														
 
															-template<typename... Ts, typename TObject>
														
 
															-HRESULT DoBasicQueryInterface(TObject* self, REFIID iid, void** ppvObject) {
														
 
															-  if (ppvObject == nullptr) return E_POINTER;
														
 
															-
														
 
															-  // Support INoMarshal to void GIT shenanigans.
														
 
															-  if (IsEqualIID(iid, __uuidof(IUnknown)) ||
														
 
															-    IsEqualIID(iid, __uuidof(INoMarshal))) {
														
 
															-    *ppvObject = reinterpret_cast<IUnknown*>(self);
														
 
															-    reinterpret_cast<IUnknown*>(self)->AddRef();
														
 
															-    return S_OK;
														
 
															-  }
														
 
															-
														
 
															-  return DoBasicQueryInterface_recurse<TObject, Ts...>(self, iid, ppvObject);
														
 
															-}
														
 
															-
														
 
															 template<typename TObject>
														
 
															 HRESULT DoBasicQueryInterface_recurse(TObject* self, REFIID iid, void** ppvObject) {
														
 
															   return E_NOINTERFACE;
														
@@ -168,6 +153,20 @@ HRESULT DoBasicQueryInterface_recurse(TObject* self, REFIID iid, void** ppvObjec
 
															   }
														
 
															   return DoBasicQueryInterface_recurse<TObject, Ts...>(self, iid, ppvObject);
														
 
															 }
														
 
															+template<typename... Ts, typename TObject>
														
 
															+HRESULT DoBasicQueryInterface(TObject* self, REFIID iid, void** ppvObject) {
														
 
															+  if (ppvObject == nullptr) return E_POINTER;
														
 
															+
														
 
															+  // Support INoMarshal to void GIT shenanigans.
														
 
															+  if (IsEqualIID(iid, __uuidof(IUnknown)) ||
														
 
															+    IsEqualIID(iid, __uuidof(INoMarshal))) {
														
 
															+    *ppvObject = reinterpret_cast<IUnknown*>(self);
														
 
															+    reinterpret_cast<IUnknown*>(self)->AddRef();
														
 
															+    return S_OK;
														
 
															+  }
														
 
															+
														
 
															+  return DoBasicQueryInterface_recurse<TObject, Ts...>(self, iid, ppvObject);
														
 
															+}
														
 
															 template <typename T>
														
 
															 HRESULT AssignToOut(T value, _Out_ T* pResult) {
														
--- a/include/dxc/dxcapi.internal.h
+++ b/include/dxc/dxcapi.internal.h
@@ -22,11 +22,11 @@ typedef interface ID3D10Blob ID3D10Blob;
 
															 ///////////////////////////////////////////////////////////////////////////////
														
 
															 // Intrinsic definitions.
														
 
															-#define AR_QUAL_IN             0x0000000000000010UI64
														
 
															-#define AR_QUAL_OUT            0x0000000000000020UI64
														
 
															-#define AR_QUAL_CONST          0x0000000000000200UI64
														
 
															-#define AR_QUAL_ROWMAJOR       0x0000000000000400UI64
														
 
															-#define AR_QUAL_COLMAJOR       0x0000000000000800UI64
														
 
															+#define AR_QUAL_IN             0x0000000000000010ULL
														
 
															+#define AR_QUAL_OUT            0x0000000000000020ULL
														
 
															+#define AR_QUAL_CONST          0x0000000000000200ULL
														
 
															+#define AR_QUAL_ROWMAJOR       0x0000000000000400ULL
														
 
															+#define AR_QUAL_COLMAJOR       0x0000000000000800ULL
														
 
															 #define AR_QUAL_IN_OUT (AR_QUAL_IN | AR_QUAL_OUT)
														
--- a/include/llvm/IR/DiagnosticPrinter.h
+++ b/include/llvm/IR/DiagnosticPrinter.h
@@ -55,6 +55,8 @@ public:
 
															   // Other types.
														
 
															   virtual DiagnosticPrinter &operator<<(const SMDiagnostic &Diag) = 0;
														
 
															+  virtual DiagnosticPrinter &
														
 
															+  operator<<(std::ios_base &(*iomanip)(std::ios_base &)) = 0; // HLSL Change
														
 
															 };
														
 
															 /// \brief Basic diagnostic printer that uses an underlying raw_ostream.
														
@@ -88,6 +90,8 @@ public:
 
															   // Other types.
														
 
															   DiagnosticPrinter &operator<<(const SMDiagnostic &Diag) override;
														
 
															+  DiagnosticPrinter &operator<<(
														
 
															+      std::ios_base &(*iomanip)(std::ios_base &)) override; // HLSL Change
														
 
															 };
														
 
															 } // End namespace llvm
														
--- a/include/llvm/Support/raw_ostream.h
+++ b/include/llvm/Support/raw_ostream.h
@@ -60,6 +60,10 @@ private:
 
															   /// this buffer.
														
 
															   char *OutBufStart, *OutBufEnd, *OutBufCur;
														
 
															+  /// The base in which numbers will be written. default is 10. 8 and 16 are
														
 
															+  /// also possible.
														
 
															+  int writeBase;  // HLSL Change
														
 
															+
														
 
															   enum BufferKind {
														
 
															     Unbuffered = 0,
														
 
															     InternalBuffer,
														
@@ -84,6 +88,7 @@ public:
 
															       : BufferMode(unbuffered ? Unbuffered : InternalBuffer) {
														
 
															     // Start out ready to flush.
														
 
															     OutBufStart = OutBufEnd = OutBufCur = nullptr;
														
 
															+    writeBase = 10; // HLSL Change
														
 
															   }
														
 
															   virtual ~raw_ostream();
														
@@ -213,6 +218,9 @@ public:
 
															   /// Output \p N in hexadecimal, without any prefix or padding.
														
 
															   raw_ostream &write_hex(unsigned long long N);
														
 
															+  /// Output \p N in writeBase, without any prefix or padding.
														
 
															+  raw_ostream &write_base(unsigned long long N); // HLSL Change
														
 
															+
														
 
															   /// Output \p Str, turning '\\', '\t', '\n', '"', and anything that doesn't
														
 
															   /// satisfy std::isprint into an escape sequence.
														
 
															   raw_ostream &write_escaped(StringRef Str, bool UseHexEscapes = false);
														
@@ -228,7 +236,10 @@ public:
 
															   // Formatted output, see the formatHex() function in Support/Format.h.
														
 
															   raw_ostream &operator<<(const FormattedNumber &);
														
 
															-  
														
 
															+
														
 
															+  raw_ostream &
														
 
															+  operator<<(std::ios_base &(*iomanip)(std::ios_base &)); // HLSL Change
														
 
															+
														
 
															   /// indent - Insert 'NumSpaces' spaces.
														
 
															   raw_ostream &indent(unsigned NumSpaces);
														
@@ -402,7 +413,7 @@ public:
 
															   /// Manually flush the stream and close the file. Note that this does not call
														
 
															   /// fsync.
														
 
															-  void close();
														
 
															+  void close() override;
														
 
															   bool supportsSeeking() { return SupportsSeeking; }
														
--- a/lib/Analysis/DxilConstantFolding.cpp
+++ b/lib/Analysis/DxilConstantFolding.cpp
@@ -35,7 +35,7 @@
 
															 #include <algorithm>
														
 
															 #include <functional>
														
 
															-#include "dxc/HLSL/Dxil.h"
														
 
															+#include "dxc/HLSL/DXIL.h"
														
 
															 using namespace llvm;
														
 
															 using namespace hlsl;
														
--- a/lib/Bitcode/Reader/BitcodeReader.cpp
+++ b/lib/Bitcode/Reader/BitcodeReader.cpp
@@ -4814,7 +4814,7 @@ void report_fatal_error_handler(void *user_datam, const std::string &reason,
 
															   BitcodeDiagnosticInfo BDI(std::error_code(EINVAL, std::system_category()),
														
 
															                             DiagnosticSeverity::DS_Error, reason);
														
 
															   data->DiagnosticHandler(BDI);
														
 
															-  throw std::exception("Invalid bitcode");
														
 
															+  throw std::runtime_error("Invalid bitcode");
														
 
															 }
														
 
															 // HLSL Change Ends
														
--- a/lib/DxcSupport/FileIOHelper.cpp
+++ b/lib/DxcSupport/FileIOHelper.cpp
@@ -80,7 +80,7 @@ static HeapMalloc g_HeapMalloc;
 
															 namespace hlsl {
														
 
															-IMalloc *GetGlobalHeapMalloc() {
														
 
															+IMalloc *GetGlobalHeapMalloc() throw() {
														
 
															   return &g_HeapMalloc;
														
 
															 }
														
@@ -141,7 +141,7 @@ void WriteBinaryFile(LPCWSTR pFileName, const void *pData, DWORD DataSize) {
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-UINT32 DxcCodePageFromBytes(const char *bytes, size_t byteLen) {
														
 
															+UINT32 DxcCodePageFromBytes(const char *bytes, size_t byteLen) throw() {
														
 
															   UINT32 codePage;
														
 
															   if (byteLen >= 4) {
														
 
															     // Now try to use the BOM to check for Unicode encodings
														
@@ -321,7 +321,7 @@ static HRESULT CodePageBufferToUtf16(UINT32 codePage, LPCVOID bufferPointer,
 
															 _Use_decl_annotations_
														
 
															 HRESULT DxcCreateBlobFromBlob(
														
 
															-    IDxcBlob *pBlob, UINT32 offset, UINT32 length, IDxcBlob **ppResult) {
														
 
															+    IDxcBlob *pBlob, UINT32 offset, UINT32 length, IDxcBlob **ppResult) throw() {
														
 
															   if (pBlob == nullptr || ppResult == nullptr) {
														
 
															     return E_POINTER;
														
 
															   }
														
@@ -347,7 +347,7 @@ HRESULT DxcCreateBlobFromBlob(
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															-DxcCreateBlobOnHeap(LPCVOID pData, UINT32 size, IDxcBlob **ppResult) {
														
 
															+DxcCreateBlobOnHeap(LPCVOID pData, UINT32 size, IDxcBlob **ppResult) throw() {
														
 
															   if (pData == nullptr || ppResult == nullptr) {
														
 
															     return E_POINTER;
														
 
															   }
														
@@ -362,7 +362,7 @@ DxcCreateBlobOnHeap(LPCVOID pData, UINT32 size, IDxcBlob **ppResult) {
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobOnHeapCopy(_In_bytecount_(size) LPCVOID pData, UINT32 size,
														
 
															-                        _COM_Outptr_ IDxcBlob **ppResult) {
														
 
															+                        _COM_Outptr_ IDxcBlob **ppResult) throw() {
														
 
															   if (pData == nullptr || ppResult == nullptr) {
														
 
															     return E_POINTER;
														
 
															   }
														
@@ -415,7 +415,7 @@ DxcCreateBlobFromFile(IMalloc *pMalloc, LPCWSTR pFileName, UINT32 *pCodePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT DxcCreateBlobFromFile(LPCWSTR pFileName, UINT32 *pCodePage,
														
 
															-                              IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+                              IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   CComPtr<IMalloc> pMalloc;
														
 
															   IFR(CoGetMalloc(1, &pMalloc));
														
 
															   return DxcCreateBlobFromFile(pMalloc, pFileName, pCodePage, ppBlobEncoding);
														
@@ -424,7 +424,7 @@ HRESULT DxcCreateBlobFromFile(LPCWSTR pFileName, UINT32 *pCodePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingSet(IMalloc *pMalloc, IDxcBlob *pBlob, UINT32 codePage,
														
 
															-                             IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+                             IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   DXASSERT_NOMSG(pMalloc != nullptr);
														
 
															   DXASSERT_NOMSG(pBlob != nullptr);
														
 
															   DXASSERT_NOMSG(ppBlobEncoding != nullptr);
														
@@ -442,7 +442,7 @@ DxcCreateBlobWithEncodingSet(IMalloc *pMalloc, IDxcBlob *pBlob, UINT32 codePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingSet(IDxcBlob *pBlob, UINT32 codePage,
														
 
															-                             IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+                             IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   return DxcCreateBlobWithEncodingSet(DxcGetThreadMallocNoRef(), pBlob,
														
 
															                                       codePage, ppBlobEncoding);
														
 
															 }
														
@@ -450,7 +450,7 @@ DxcCreateBlobWithEncodingSet(IDxcBlob *pBlob, UINT32 codePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT DxcCreateBlobWithEncodingFromPinned(LPCVOID pText, UINT32 size,
														
 
															                                             UINT32 codePage,
														
 
															-                                            IDxcBlobEncoding **pBlobEncoding) {
														
 
															+                                            IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   InternalDxcBlobEncoding *internalEncoding;
														
@@ -467,7 +467,7 @@ _Use_decl_annotations_
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingFromStream(IStream *pStream, bool newInstanceAlways,
														
 
															                                     UINT32 codePage,
														
 
															-                                    IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+                                    IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   *ppBlobEncoding = nullptr;
														
 
															   if (pStream == nullptr) {
														
 
															     return S_OK;
														
@@ -496,7 +496,7 @@ DxcCreateBlobWithEncodingFromStream(IStream *pStream, bool newInstanceAlways,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingOnHeap(LPCVOID pText, UINT32 size, UINT32 codePage,
														
 
															-                                IDxcBlobEncoding **pBlobEncoding) {
														
 
															+                                IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   InternalDxcBlobEncoding *internalEncoding;
														
@@ -511,7 +511,7 @@ DxcCreateBlobWithEncodingOnHeap(LPCVOID pText, UINT32 size, UINT32 codePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingOnHeapCopy(LPCVOID pText, UINT32 size, UINT32 codePage,
														
 
															-  IDxcBlobEncoding **pBlobEncoding) {
														
 
															+  IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   CDxcMallocHeapPtr<char> heapCopy(DxcGetThreadMallocNoRef());
														
@@ -532,7 +532,7 @@ DxcCreateBlobWithEncodingOnHeapCopy(LPCVOID pText, UINT32 size, UINT32 codePage,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingOnMalloc(LPCVOID pText, IMalloc *pIMalloc, UINT32 size, UINT32 codePage,
														
 
															-  IDxcBlobEncoding **pBlobEncoding) {
														
 
															+  IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   InternalDxcBlobEncoding* internalEncoding;
														
@@ -546,7 +546,7 @@ DxcCreateBlobWithEncodingOnMalloc(LPCVOID pText, IMalloc *pIMalloc, UINT32 size,
 
															 _Use_decl_annotations_
														
 
															 HRESULT
														
 
															 DxcCreateBlobWithEncodingOnMallocCopy(IMalloc *pIMalloc, LPCVOID pText, UINT32 size, UINT32 codePage,
														
 
															-  IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+  IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   *ppBlobEncoding = nullptr;
														
 
															   void *pData = pIMalloc->Alloc(size);
														
 
															   if (pData == nullptr)
														
@@ -562,7 +562,7 @@ DxcCreateBlobWithEncodingOnMallocCopy(IMalloc *pIMalloc, LPCVOID pText, UINT32 s
 
															 _Use_decl_annotations_
														
 
															-HRESULT DxcGetBlobAsUtf8(IDxcBlob *pBlob, IDxcBlobEncoding **pBlobEncoding) {
														
 
															+HRESULT DxcGetBlobAsUtf8(IDxcBlob *pBlob, IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   HRESULT hr;
														
@@ -654,7 +654,7 @@ HRESULT DxcGetBlobAsUtf8(IDxcBlob *pBlob, IDxcBlobEncoding **pBlobEncoding) {
 
															 HRESULT
														
 
															 DxcGetBlobAsUtf8NullTerm(_In_ IDxcBlob *pBlob,
														
 
															-                         _COM_Outptr_ IDxcBlobEncoding **ppBlobEncoding) {
														
 
															+                         _COM_Outptr_ IDxcBlobEncoding **ppBlobEncoding) throw() {
														
 
															   *ppBlobEncoding = nullptr;
														
 
															   HRESULT hr;
														
@@ -700,7 +700,7 @@ DxcGetBlobAsUtf8NullTerm(_In_ IDxcBlob *pBlob,
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-HRESULT DxcGetBlobAsUtf16(IDxcBlob *pBlob, IMalloc *pMalloc, IDxcBlobEncoding **pBlobEncoding) {
														
 
															+HRESULT DxcGetBlobAsUtf16(IDxcBlob *pBlob, IMalloc *pMalloc, IDxcBlobEncoding **pBlobEncoding) throw() {
														
 
															   *pBlobEncoding = nullptr;
														
 
															   HRESULT hr;
														
@@ -815,22 +815,26 @@ public:
 
															   }
														
 
															   // AbstractMemoryStream implementation.
														
 
															-  __override LPBYTE GetPtr() {
														
 
															+  LPBYTE GetPtr() throw() override {
														
 
															     return m_pMemory;
														
 
															   }
														
 
															-  __override ULONG GetPtrSize() {
														
 
															+  ULONG GetPtrSize() throw() override {
														
 
															     return m_size;
														
 
															   }
														
 
															-  __override LPBYTE Detach() {
														
 
															+  LPBYTE Detach() throw() override {
														
 
															     LPBYTE result = m_pMemory;
														
 
															     m_pMemory = nullptr;
														
 
															     Reset();
														
 
															     return result;
														
 
															   }
														
 
															-  __override HRESULT Reserve(ULONG targetSize) {
														
 
															+  UINT64 GetPosition() throw() override {
														
 
															+    return m_offset;
														
 
															+  }
														
 
															+
														
 
															+  HRESULT Reserve(ULONG targetSize) throw() override {
														
 
															     if (m_pMemory == nullptr) {
														
 
															       m_pMemory = (LPBYTE)m_pMalloc->Alloc(targetSize);
														
 
															       if (m_pMemory == nullptr) {
														
@@ -851,18 +855,15 @@ public:
 
															   }
														
 
															   // IDxcBlob implementation. Requires no further writes.
														
 
															-  __override LPVOID STDMETHODCALLTYPE GetBufferPointer(void) {
														
 
															+  LPVOID STDMETHODCALLTYPE GetBufferPointer(void) override {
														
 
															     return m_pMemory;
														
 
															   }
														
 
															-  __override SIZE_T STDMETHODCALLTYPE GetBufferSize(void) {
														
 
															+  SIZE_T STDMETHODCALLTYPE GetBufferSize(void) override {
														
 
															     return m_size;
														
 
															   }
														
 
															-  __override UINT64 GetPosition() {
														
 
															-    return m_offset;
														
 
															-  }
														
 
															   // ISequentialStream implementation.
														
 
															-  __override HRESULT STDMETHODCALLTYPE Read(void* pv, ULONG cb, ULONG* pcbRead) {
														
 
															+  HRESULT STDMETHODCALLTYPE Read(void* pv, ULONG cb, ULONG* pcbRead) override {
														
 
															     if (!pv || !pcbRead) return E_POINTER;
														
 
															     // If we seeked past the end, read nothing.
														
 
															     if (m_offset > m_size) {
														
@@ -876,7 +877,7 @@ public:
 
															     return (*pcbRead == cb) ? S_OK : S_FALSE;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Write(void const* pv, ULONG cb, ULONG* pcbWritten) {
														
 
															+  HRESULT STDMETHODCALLTYPE Write(void const* pv, ULONG cb, ULONG* pcbWritten) override {
														
 
															     if (!pv || !pcbWritten) return E_POINTER;
														
 
															     if (cb + m_offset > m_allocSize) {
														
 
															       HRESULT hr = Grow(cb + m_offset);
														
@@ -894,7 +895,7 @@ public:
 
															   }
														
 
															   // IStream implementation.
														
 
															-  __override HRESULT STDMETHODCALLTYPE SetSize(ULARGE_INTEGER val) {
														
 
															+  HRESULT STDMETHODCALLTYPE SetSize(ULARGE_INTEGER val) override {
														
 
															     if (val.HighPart != 0) {
														
 
															       return E_OUTOFMEMORY;
														
 
															     }
														
@@ -912,31 +913,31 @@ public:
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE CopyTo(IStream *, ULARGE_INTEGER,
														
 
															+  HRESULT STDMETHODCALLTYPE CopyTo(IStream *, ULARGE_INTEGER,
														
 
															     ULARGE_INTEGER *,
														
 
															-    ULARGE_INTEGER *) {
														
 
															+    ULARGE_INTEGER *) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Commit(DWORD) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Commit(DWORD) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Revert(void) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Revert(void) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE LockRegion(ULARGE_INTEGER,
														
 
															-    ULARGE_INTEGER, DWORD) {
														
 
															+  HRESULT STDMETHODCALLTYPE LockRegion(ULARGE_INTEGER,
														
 
															+    ULARGE_INTEGER, DWORD) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE UnlockRegion(ULARGE_INTEGER,
														
 
															-    ULARGE_INTEGER, DWORD) {
														
 
															+  HRESULT STDMETHODCALLTYPE UnlockRegion(ULARGE_INTEGER,
														
 
															+    ULARGE_INTEGER, DWORD) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Clone(IStream **) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Clone(IStream **) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Seek(LARGE_INTEGER liDistanceToMove,
														
 
															+  HRESULT STDMETHODCALLTYPE Seek(LARGE_INTEGER liDistanceToMove,
														
 
															     DWORD dwOrigin,
														
 
															-    ULARGE_INTEGER *lpNewFilePointer) {
														
 
															+    ULARGE_INTEGER *lpNewFilePointer) override {
														
 
															     if (lpNewFilePointer != nullptr) {
														
 
															       lpNewFilePointer->QuadPart = 0;
														
 
															     }
														
@@ -968,8 +969,8 @@ public:
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Stat(STATSTG *pStatstg,
														
 
															-    DWORD grfStatFlag) {
														
 
															+  HRESULT STDMETHODCALLTYPE Stat(STATSTG *pStatstg,
														
 
															+    DWORD grfStatFlag) override {
														
 
															     if (pStatstg == nullptr) {
														
 
															       return E_POINTER;
														
 
															     }
														
@@ -1003,8 +1004,8 @@ public:
 
															   }
														
 
															   // ISequentialStream implementation.
														
 
															-  __override HRESULT STDMETHODCALLTYPE Read(void *pv, ULONG cb,
														
 
															-    ULONG *pcbRead) {
														
 
															+  HRESULT STDMETHODCALLTYPE Read(void *pv, ULONG cb,
														
 
															+    ULONG *pcbRead) override {
														
 
															     if (!pv || !pcbRead)
														
 
															       return E_POINTER;
														
 
															     ULONG cbLeft = m_size - m_offset;
														
@@ -1014,40 +1015,40 @@ public:
 
															     return (*pcbRead == cb) ? S_OK : S_FALSE;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Write(void const *, ULONG, ULONG *) {
														
 
															+  HRESULT STDMETHODCALLTYPE Write(void const *, ULONG, ULONG *) override {
														
 
															     return STG_E_ACCESSDENIED;
														
 
															   }
														
 
															   // IStream implementation.
														
 
															-  __override HRESULT STDMETHODCALLTYPE SetSize(ULARGE_INTEGER val) {
														
 
															+  HRESULT STDMETHODCALLTYPE SetSize(ULARGE_INTEGER val) override {
														
 
															     return STG_E_ACCESSDENIED;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE CopyTo(IStream *, ULARGE_INTEGER,
														
 
															+  HRESULT STDMETHODCALLTYPE CopyTo(IStream *, ULARGE_INTEGER,
														
 
															     ULARGE_INTEGER *,
														
 
															-    ULARGE_INTEGER *) {
														
 
															+    ULARGE_INTEGER *) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Commit(DWORD) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Commit(DWORD) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Revert(void) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Revert(void) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE LockRegion(ULARGE_INTEGER,
														
 
															-    ULARGE_INTEGER, DWORD) {
														
 
															+  HRESULT STDMETHODCALLTYPE LockRegion(ULARGE_INTEGER,
														
 
															+    ULARGE_INTEGER, DWORD) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE UnlockRegion(ULARGE_INTEGER,
														
 
															-    ULARGE_INTEGER, DWORD) {
														
 
															+  HRESULT STDMETHODCALLTYPE UnlockRegion(ULARGE_INTEGER,
														
 
															+    ULARGE_INTEGER, DWORD) override {
														
 
															     return E_NOTIMPL;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Clone(IStream **) { return E_NOTIMPL; }
														
 
															+  HRESULT STDMETHODCALLTYPE Clone(IStream **) override { return E_NOTIMPL; }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Seek(LARGE_INTEGER liDistanceToMove,
														
 
															+  HRESULT STDMETHODCALLTYPE Seek(LARGE_INTEGER liDistanceToMove,
														
 
															     DWORD dwOrigin,
														
 
															-    ULARGE_INTEGER *lpNewFilePointer) {
														
 
															+    ULARGE_INTEGER *lpNewFilePointer) override {
														
 
															     if (lpNewFilePointer != nullptr) {
														
 
															       lpNewFilePointer->QuadPart = 0;
														
 
															     }
														
@@ -1084,8 +1085,8 @@ public:
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Stat(STATSTG *pStatstg,
														
 
															-    DWORD grfStatFlag) {
														
 
															+  HRESULT STDMETHODCALLTYPE Stat(STATSTG *pStatstg,
														
 
															+    DWORD grfStatFlag) override {
														
 
															     if (pStatstg == nullptr) {
														
 
															       return E_POINTER;
														
 
															     }
														
@@ -1096,7 +1097,7 @@ public:
 
															   }
														
 
															 };
														
 
															-HRESULT CreateMemoryStream(_In_ IMalloc *pMalloc, _COM_Outptr_ AbstractMemoryStream** ppResult) {
														
 
															+HRESULT CreateMemoryStream(_In_ IMalloc *pMalloc, _COM_Outptr_ AbstractMemoryStream** ppResult) throw() {
														
 
															   if (pMalloc == nullptr || ppResult == nullptr) {
														
 
															     return E_POINTER;
														
 
															   }
														
@@ -1106,7 +1107,7 @@ HRESULT CreateMemoryStream(_In_ IMalloc *pMalloc, _COM_Outptr_ AbstractMemoryStr
 
															   return (*ppResult == nullptr) ? E_OUTOFMEMORY : S_OK;
														
 
															 }
														
 
															-HRESULT CreateReadOnlyBlobStream(_In_ IDxcBlob *pSource, _COM_Outptr_ IStream** ppResult) {
														
 
															+HRESULT CreateReadOnlyBlobStream(_In_ IDxcBlob *pSource, _COM_Outptr_ IStream** ppResult) throw() {
														
 
															   if (pSource == nullptr || ppResult == nullptr) {
														
 
															     return E_POINTER;
														
 
															   }
														
--- a/lib/DxcSupport/HLSLOptions.cpp
+++ b/lib/DxcSupport/HLSLOptions.cpp
@@ -159,6 +159,8 @@ MainArgs::MainArgs(llvm::ArrayRef<llvm::StringRef> args) {
 
															 MainArgs& MainArgs::operator=(const MainArgs &other) {
														
 
															   Utf8StringVector.clear();
														
 
															   Utf8CharPtrVector.clear();
														
 
															+  Utf8StringVector.reserve(other.Utf8StringVector.size());
														
 
															+  Utf8CharPtrVector.reserve(other.Utf8StringVector.size());
														
 
															   for (const std::string &str : other.Utf8StringVector) {
														
 
															     Utf8StringVector.emplace_back(str);
														
 
															     Utf8CharPtrVector.push_back(Utf8StringVector.back().data());
														
@@ -464,7 +466,7 @@ int ReadDxcOpts(const OptTable *optionTable, unsigned flagsToInclude,
 
															     if (opts.AllResourcesBound || opts.AvoidFlowControl ||
														
 
															         opts.CodeGenHighLevel || opts.DebugInfo || opts.DefaultColMajor ||
														
 
															         opts.DefaultRowMajor || opts.Defines.size() != 0 ||
														
 
															-        opts.DisableOptimizations || 
														
 
															+        opts.DisableOptimizations ||
														
 
															         !opts.EntryPoint.empty() || !opts.ForceRootSigVer.empty() ||
														
 
															         opts.PreferFlowControl || !opts.TargetProfile.empty()) {
														
 
															       errors << "Cannot specify compilation options when reading a binary file.";
														
@@ -495,7 +497,7 @@ int ReadDxcOpts(const OptTable *optionTable, unsigned flagsToInclude,
 
															   opts.VkUseGlLayout = Args.hasFlag(OPT_fvk_use_gl_layout, OPT_INVALID, false);
														
 
															   opts.VkUseDxLayout = Args.hasFlag(OPT_fvk_use_dx_layout, OPT_INVALID, false);
														
 
															   opts.SpvEnableReflect = Args.hasFlag(OPT_fspv_reflect, OPT_INVALID, false);
														
 
															-  opts.VkIgnoreUnusedResources = Args.hasFlag(OPT_fvk_ignore_unused_resources, OPT_INVALID, false);
														
 
															+  opts.VkNoWarnIgnoredFeatures = Args.hasFlag(OPT_Wno_vk_ignored_features, OPT_INVALID, false);
														
 
															   // Collects the arguments for -fvk-{b|s|t|u}-shift.
														
 
															   const auto handleVkShiftArgs =
														
@@ -560,7 +562,7 @@ int ReadDxcOpts(const OptTable *optionTable, unsigned flagsToInclude,
 
															       Args.hasFlag(OPT_fvk_use_gl_layout, OPT_INVALID, false) ||
														
 
															       Args.hasFlag(OPT_fvk_use_dx_layout, OPT_INVALID, false) ||
														
 
															       Args.hasFlag(OPT_fspv_reflect, OPT_INVALID, false) ||
														
 
															-      Args.hasFlag(OPT_fvk_ignore_unused_resources, OPT_INVALID, false) ||
														
 
															+      Args.hasFlag(OPT_Wno_vk_ignored_features, OPT_INVALID, false) ||
														
 
															       !Args.getLastArgValue(OPT_fvk_stage_io_order_EQ).empty() ||
														
 
															       !Args.getLastArgValue(OPT_fspv_extension_EQ).empty() ||
														
 
															       !Args.getLastArgValue(OPT_fspv_target_env_EQ).empty() ||
														
--- a/lib/DxcSupport/LLVMBuild.txt
+++ b/lib/DxcSupport/LLVMBuild.txt
@@ -0,0 +1,21 @@
 
															+;===- ./lib/DxcSupport/LLVMBuild.txt ---------------------------*- Conf -*--===;
														
 
															+;
														
 
															+;                     The LLVM Compiler Infrastructure
														
 
															+;
														
 
															+; This file is distributed under the University of Illinois Open Source
														
 
															+; License. See LICENSE.TXT for details.
														
 
															+;
														
 
															+;===------------------------------------------------------------------------===;
														
 
															+;
														
 
															+; This is an LLVMBuild description file for the components in this subdirectory.
														
 
															+;
														
 
															+; For more information on the LLVMBuild system, please see:
														
 
															+;
														
 
															+;   http://llvm.org/docs/LLVMBuild.html
														
 
															+;
														
 
															+;===------------------------------------------------------------------------===;
														
 
															+
														
 
															+[component_0]
														
 
															+type = Library
														
 
															+name = DxcSupport
														
 
															+parent = Libraries
														
--- a/lib/DxcSupport/dxcmem.cpp
+++ b/lib/DxcSupport/dxcmem.cpp
@@ -32,7 +32,7 @@ IMalloc *DxcGetThreadMallocNoRef() throw();
 
															 _Ret_maybenull_ _Post_writable_byte_size_(nBytes) void *DxcThreadAlloc(size_t nBytes) throw();
														
 
															 void DxcThreadFree(void *) throw();
														
 
															-HRESULT DxcInitThreadMalloc() {
														
 
															+HRESULT DxcInitThreadMalloc() throw() {
														
 
															   DXASSERT(g_ThreadMallocTlsIndex == 0, "else InitThreadMalloc already called");
														
 
															   DXASSERT(g_pDefaultMalloc == nullptr, "else InitThreadMalloc already called");
														
@@ -51,7 +51,7 @@ HRESULT DxcInitThreadMalloc() {
 
															   return S_OK;
														
 
															 }
														
 
															-void DxcCleanupThreadMalloc() {
														
 
															+void DxcCleanupThreadMalloc() throw() {
														
 
															   if (g_ThreadMallocTlsIndex) {
														
 
															     TlsFree(g_ThreadMallocTlsIndex);
														
 
															     g_ThreadMallocTlsIndex = 0;
														
@@ -61,26 +61,26 @@ void DxcCleanupThreadMalloc() {
 
															   }
														
 
															 }
														
 
															-IMalloc *DxcGetThreadMallocNoRef() {
														
 
															+IMalloc *DxcGetThreadMallocNoRef() throw() {
														
 
															   DXASSERT(g_ThreadMallocTlsIndex != 0, "else prior to DxcInitThreadMalloc or after DxcCleanupThreadMalloc");
														
 
															   return reinterpret_cast<IMalloc *>(TlsGetValue(g_ThreadMallocTlsIndex));
														
 
															 }
														
 
															-void DxcClearThreadMalloc() {
														
 
															+void DxcClearThreadMalloc() throw() {
														
 
															   DXASSERT(g_ThreadMallocTlsIndex != 0, "else prior to DxcInitThreadMalloc or after DxcCleanupThreadMalloc");
														
 
															   IMalloc *pMalloc = DxcGetThreadMallocNoRef();
														
 
															   DXVERIFY_NOMSG(TlsSetValue(g_ThreadMallocTlsIndex, nullptr));
														
 
															   pMalloc->Release();
														
 
															 }
														
 
															-void DxcSetThreadMalloc(IMalloc *pMalloc) {
														
 
															+void DxcSetThreadMalloc(IMalloc *pMalloc) throw() {
														
 
															   DXASSERT(g_ThreadMallocTlsIndex != 0, "else prior to DxcInitThreadMalloc or after DxcCleanupThreadMalloc");
														
 
															   DXASSERT(DxcGetThreadMallocNoRef() == nullptr, "else nested allocation invoked");
														
 
															   DXVERIFY_NOMSG(TlsSetValue(g_ThreadMallocTlsIndex, pMalloc));
														
 
															   pMalloc->AddRef();
														
 
															 }
														
 
															-void DxcSetThreadMallocOrDefault(IMalloc *pMalloc) {
														
 
															+void DxcSetThreadMallocOrDefault(IMalloc *pMalloc) throw() {
														
 
															   DxcSetThreadMalloc(pMalloc ? pMalloc : g_pDefaultMalloc);
														
 
															 }
														
 
															-IMalloc *DxcSwapThreadMalloc(IMalloc *pMalloc, IMalloc **ppPrior) {
														
 
															+IMalloc *DxcSwapThreadMalloc(IMalloc *pMalloc, IMalloc **ppPrior) throw() {
														
 
															   DXASSERT(g_ThreadMallocTlsIndex != 0, "else prior to DxcInitThreadMalloc or after DxcCleanupThreadMalloc");
														
 
															   IMalloc *pPrior = DxcGetThreadMallocNoRef();
														
 
															   if (ppPrior) {
														
@@ -89,6 +89,6 @@ IMalloc *DxcSwapThreadMalloc(IMalloc *pMalloc, IMalloc **ppPrior) {
 
															   DXVERIFY_NOMSG(TlsSetValue(g_ThreadMallocTlsIndex, pMalloc));
														
 
															   return pMalloc;
														
 
															 }
														
 
															-IMalloc *DxcSwapThreadMallocOrDefault(IMalloc *pMallocOrNull, IMalloc **ppPrior) {
														
 
															+IMalloc *DxcSwapThreadMallocOrDefault(IMalloc *pMallocOrNull, IMalloc **ppPrior) throw() {
														
 
															   return DxcSwapThreadMalloc(pMallocOrNull ? pMallocOrNull : g_pDefaultMalloc, ppPrior);
														
 
															 }
														
--- a/lib/HLSL/DxcOptimizer.cpp
+++ b/lib/HLSL/DxcOptimizer.cpp
@@ -457,25 +457,25 @@ public:
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetOptionName(_COM_Outptr_ LPWSTR *ppResult) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetOptionName(_COM_Outptr_ LPWSTR *ppResult) override {
														
 
															     return Utf8ToUtf16CoTaskMalloc(m_pOptionName, ppResult);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetDescription(_COM_Outptr_ LPWSTR *ppResult) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetDescription(_COM_Outptr_ LPWSTR *ppResult) override {
														
 
															     return Utf8ToUtf16CoTaskMalloc(m_pDescription, ppResult);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetOptionArgCount(_Out_ UINT32 *pCount) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetOptionArgCount(_Out_ UINT32 *pCount) override {
														
 
															     if (!pCount) return E_INVALIDARG;
														
 
															     *pCount = m_pArgDescriptions.size();
														
 
															     return S_OK;
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetOptionArgName(UINT32 argIndex, LPWSTR *ppResult) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetOptionArgName(UINT32 argIndex, LPWSTR *ppResult) override {
														
 
															     if (!ppResult) return E_INVALIDARG;
														
 
															     if (argIndex >= m_pArgNames.size()) return E_INVALIDARG;
														
 
															     return Utf8ToUtf16CoTaskMalloc(m_pArgNames[argIndex], ppResult);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetOptionArgDescription(UINT32 argIndex, LPWSTR *ppResult) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetOptionArgDescription(UINT32 argIndex, LPWSTR *ppResult) override {
														
 
															     if (!ppResult) return E_INVALIDARG;
														
 
															     if (argIndex >= m_pArgDescriptions.size()) return E_INVALIDARG;
														
 
															     return Utf8ToUtf16CoTaskMalloc(m_pArgDescriptions[argIndex], ppResult);
														
@@ -498,14 +498,14 @@ public:
 
															   HRESULT Initialize();
														
 
															   const PassInfo *getPassByID(llvm::AnalysisID PassID);
														
 
															   const PassInfo *getPassByName(const char *pName);
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetAvailablePassCount(_Out_ UINT32 *pCount) {
														
 
															+  HRESULT STDMETHODCALLTYPE GetAvailablePassCount(_Out_ UINT32 *pCount) override {
														
 
															     return AssignToOut<UINT32>(m_passes.size(), pCount);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetAvailablePass(UINT32 index, _COM_Outptr_ IDxcOptimizerPass** ppResult);
														
 
															-  __override HRESULT STDMETHODCALLTYPE RunOptimizer(IDxcBlob *pBlob,
														
 
															+  HRESULT STDMETHODCALLTYPE GetAvailablePass(UINT32 index, _COM_Outptr_ IDxcOptimizerPass** ppResult) override;
														
 
															+  HRESULT STDMETHODCALLTYPE RunOptimizer(IDxcBlob *pBlob,
														
 
															     _In_count_(optionCount) LPCWSTR *ppOptions, UINT32 optionCount,
														
 
															     _COM_Outptr_ IDxcBlob **ppOutputModule,
														
 
															-    _COM_Outptr_opt_ IDxcBlobEncoding **ppOutputText);
														
 
															+    _COM_Outptr_opt_ IDxcBlobEncoding **ppOutputText) override;
														
 
															 };
														
 
															 class CapturePassManager : public llvm::legacy::PassManagerBase {
														
@@ -516,7 +516,7 @@ public:
 
															     for (auto P : Passes) delete P;
														
 
															   }
														
 
															-  __override void add(Pass *P) {
														
 
															+  void add(Pass *P) override {
														
 
															     Passes.push_back(P);
														
 
															   }
														
@@ -535,7 +535,7 @@ HRESULT DxcOptimizer::Initialize() {
 
															     struct PRL : public PassRegistrationListener {
														
 
															       std::vector<const PassInfo *> *Passes;
														
 
															-      __override void passEnumerate(const PassInfo * PI) {
														
 
															+      void passEnumerate(const PassInfo * PI) override {
														
 
															         DXASSERT(nullptr != PI->getNormalCtor(), "else cannot construct");
														
 
															         Passes->push_back(PI);
														
 
															       }
														
--- a/lib/HLSL/DxilAddPixelHitInstrumentation.cpp
+++ b/lib/HLSL/DxilAddPixelHitInstrumentation.cpp
@@ -75,7 +75,7 @@ bool DxilAddPixelHitInstrumentation::runOnModule(Module &M)
 
															   // about the shader having selected components that don't include x or y.
														
 
															   // If not present, we add it.
														
 
															   if ( SV_Position == InputElements.end() ) {
														
 
															-    auto SVPosition = std::make_unique<DxilSignatureElement>(DXIL::SigPointKind::PSIn);
														
 
															+    auto SVPosition = llvm::make_unique<DxilSignatureElement>(DXIL::SigPointKind::PSIn);
														
 
															     SVPosition->Initialize("Position", hlsl::CompType::getF32(), hlsl::DXIL::InterpolationMode::Linear, 1, 4, SVPositionIndex == -1 ? 0 : SVPositionIndex, 0);
														
 
															     SVPosition->AppendSemanticIndex(0);
														
 
															     SVPosition->SetSigPointKind(DXIL::SigPointKind::PSIn);
														
--- a/lib/HLSL/DxilContainerAssembler.cpp
+++ b/lib/HLSL/DxilContainerAssembler.cpp
@@ -242,11 +242,11 @@ public:
 
															     calcSizes();
														
 
															   }
														
 
															-  __override uint32_t size() const {
														
 
															+  uint32_t size() const override {
														
 
															     return m_lastOffset;
														
 
															   }
														
 
															-  __override void write(AbstractMemoryStream *pStream) {
														
 
															+  void write(AbstractMemoryStream *pStream) override {
														
 
															     UINT64 startPos = pStream->GetPosition();
														
 
															     const std::vector<std::unique_ptr<hlsl::DxilSignatureElement>> &elements = m_signature.GetElements();
														
@@ -332,10 +332,10 @@ public:
 
															   DxilFeatureInfoWriter(const DxilModule &M) {
														
 
															     featureInfo.FeatureFlags = M.m_ShaderFlags.GetFeatureInfo();
														
 
															   }
														
 
															-  __override uint32_t size() const {
														
 
															+  uint32_t size() const override {
														
 
															     return sizeof(DxilShaderFeatureInfo);
														
 
															   }
														
 
															-  __override void write(AbstractMemoryStream *pStream) {
														
 
															+  void write(AbstractMemoryStream *pStream) override {
														
 
															     IFT(WriteStreamValue(pStream, featureInfo.FeatureFlags));
														
 
															   }
														
 
															 };
														
@@ -488,11 +488,11 @@ public:
 
															       DXASSERT(false, "PSV InitNew failed computing size!");
														
 
															     }
														
 
															   }
														
 
															-  __override uint32_t size() const {
														
 
															+  uint32_t size() const override {
														
 
															     return m_PSVBufferSize;
														
 
															   }
														
 
															-  __override void write(AbstractMemoryStream *pStream) {
														
 
															+  void write(AbstractMemoryStream *pStream) override {
														
 
															     m_PSVBuffer.resize(m_PSVBufferSize);
														
 
															     if (!m_PSV.InitNew(m_PSVInitInfo, m_PSVBuffer.data(), &m_PSVBufferSize)) {
														
 
															       DXASSERT(false, "PSV InitNew failed!");
														
@@ -1059,11 +1059,11 @@ private:
 
															   llvm::SmallVector<DxilPart, 8> m_Parts;
														
 
															 public:
														
 
															-  __override void AddPart(uint32_t FourCC, uint32_t Size, WriteFn Write) {
														
 
															+  void AddPart(uint32_t FourCC, uint32_t Size, WriteFn Write) override {
														
 
															     m_Parts.emplace_back(FourCC, Size, Write);
														
 
															   }
														
 
															-  __override uint32_t size() const {
														
 
															+  uint32_t size() const override {
														
 
															     uint32_t partSize = 0;
														
 
															     for (auto &part : m_Parts) {
														
 
															       partSize += part.Header.PartSize;
														
@@ -1071,7 +1071,7 @@ public:
 
															     return (uint32_t)GetDxilContainerSizeFromParts((uint32_t)m_Parts.size(), partSize);
														
 
															   }
														
 
															-  __override void write(AbstractMemoryStream *pStream) {
														
 
															+  void write(AbstractMemoryStream *pStream) override {
														
 
															     DxilContainerHeader header;
														
 
															     const uint32_t PartCount = (uint32_t)m_Parts.size();
														
 
															     uint32_t containerSizeInBytes = size();
														
@@ -1247,7 +1247,9 @@ void hlsl::SerializeDxilContainerForModule(DxilModule *pModule,
 
															       // If the debug name should be specific to the sources, base the name on the debug
														
 
															       // bitcode, which will include the source references, line numbers, etc. Otherwise,
														
 
															       // do it exclusively on the target shader bitcode.
														
 
															-      pHashStream = (int)(Flags & SerializeDxilFlags::DebugNameDependOnSource) ? pModuleBitcode : pProgramStream;
														
 
															+      pHashStream = (int)(Flags & SerializeDxilFlags::DebugNameDependOnSource)
														
 
															+                        ? CComPtr<AbstractMemoryStream>(pModuleBitcode)
														
 
															+                        : CComPtr<AbstractMemoryStream>(pProgramStream);
														
 
															       const uint32_t DebugInfoNameHashLen = 32;   // 32 chars of MD5
														
 
															       const uint32_t DebugInfoNameSuffix = 4;     // '.lld'
														
 
															       const uint32_t DebugInfoNameNullAndPad = 4; // '\0\0\0\0'
														
--- a/lib/HLSL/DxilContainerReflection.cpp
+++ b/lib/HLSL/DxilContainerReflection.cpp
@@ -60,12 +60,12 @@ public:
 
															     return DoBasicQueryInterface<IDxcContainerReflection>(this, iid, ppvObject);
														
 
															   }
														
 
															-  __override HRESULT STDMETHODCALLTYPE Load(_In_ IDxcBlob *pContainer);
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetPartCount(_Out_ UINT32 *pResult);
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetPartKind(UINT32 idx, _Out_ UINT32 *pResult);
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetPartContent(UINT32 idx, _COM_Outptr_ IDxcBlob **ppResult);
														
 
															-  __override HRESULT STDMETHODCALLTYPE FindFirstPartKind(UINT32 kind, _Out_ UINT32 *pResult);
														
 
															-  __override HRESULT STDMETHODCALLTYPE GetPartReflection(UINT32 idx, REFIID iid, _COM_Outptr_ void **ppvObject);
														
 
															+  HRESULT STDMETHODCALLTYPE Load(_In_ IDxcBlob *pContainer) override;
														
 
															+  HRESULT STDMETHODCALLTYPE GetPartCount(_Out_ UINT32 *pResult) override;
														
 
															+  HRESULT STDMETHODCALLTYPE GetPartKind(UINT32 idx, _Out_ UINT32 *pResult) override;
														
 
															+  HRESULT STDMETHODCALLTYPE GetPartContent(UINT32 idx, _COM_Outptr_ IDxcBlob **ppResult) override;
														
 
															+  HRESULT STDMETHODCALLTYPE FindFirstPartKind(UINT32 kind, _Out_ UINT32 *pResult) override;
														
 
															+  HRESULT STDMETHODCALLTYPE GetPartReflection(UINT32 idx, REFIID iid, _COM_Outptr_ void **ppvObject) override;
														
 
															 };
														
 
															 class CShaderReflectionConstantBuffer;
														
--- a/lib/HLSL/DxilDebugInstrumentation.cpp
+++ b/lib/HLSL/DxilDebugInstrumentation.cpp
@@ -264,7 +264,7 @@ DxilDebugInstrumentation::SystemValueIndices DxilDebugInstrumentation::addRequir
 
															     // about the shader having selected components that don't include x or y.
														
 
															     // If not present, we add it.
														
 
															     if (Existing_SV_Position == InputElements.end()) {
														
 
															-      auto Added_SV_Position = std::make_unique<DxilSignatureElement>(DXIL::SigPointKind::PSIn);
														
 
															+      auto Added_SV_Position = llvm::make_unique<DxilSignatureElement>(DXIL::SigPointKind::PSIn);
														
 
															       Added_SV_Position->Initialize("Position", hlsl::CompType::getF32(), hlsl::DXIL::InterpolationMode::Linear, 1, 4);
														
 
															       Added_SV_Position->AppendSemanticIndex(0);
														
 
															       Added_SV_Position->SetSigPointKind(DXIL::SigPointKind::PSIn);
														
@@ -286,7 +286,7 @@ DxilDebugInstrumentation::SystemValueIndices DxilDebugInstrumentation::addRequir
 
															         return Element->GetSemantic()->GetKind() == hlsl::DXIL::SemanticKind::VertexID; });
														
 
															       if (Existing_SV_VertexId == InputElements.end()) {
														
 
															-        auto Added_SV_VertexId = std::make_unique<DxilSignatureElement>(DXIL::SigPointKind::VSIn);
														
 
															+        auto Added_SV_VertexId = llvm::make_unique<DxilSignatureElement>(DXIL::SigPointKind::VSIn);
														
 
															         Added_SV_VertexId->Initialize("VertexId", hlsl::CompType::getF32(), hlsl::DXIL::InterpolationMode::Undefined, 1, 1);
														
 
															         Added_SV_VertexId->AppendSemanticIndex(0);
														
 
															         Added_SV_VertexId->SetSigPointKind(DXIL::SigPointKind::VSIn);
														
@@ -306,7 +306,7 @@ DxilDebugInstrumentation::SystemValueIndices DxilDebugInstrumentation::addRequir
 
															         return Element->GetSemantic()->GetKind() == hlsl::DXIL::SemanticKind::InstanceID; });
														
 
															       if (Existing_SV_InstanceId == InputElements.end()) {
														
 
															-        auto Added_SV_InstanceId = std::make_unique<DxilSignatureElement>(DXIL::SigPointKind::VSIn);
														
 
															+        auto Added_SV_InstanceId = llvm::make_unique<DxilSignatureElement>(DXIL::SigPointKind::VSIn);
														
 
															         Added_SV_InstanceId->Initialize("InstanceId", hlsl::CompType::getF32(), hlsl::DXIL::InterpolationMode::Undefined, 1, 1);
														
 
															         Added_SV_InstanceId->AppendSemanticIndex(0);
														
 
															         Added_SV_InstanceId->SetSigPointKind(DXIL::SigPointKind::VSIn);
														
--- a/lib/HLSL/DxilGenerationPass.cpp
+++ b/lib/HLSL/DxilGenerationPass.cpp
@@ -153,26 +153,26 @@ void InitDxilModuleFromHLModule(HLModule &H, DxilModule &M, DxilEntrySignature *
 
															   // Resources
														
 
															   for (auto && C : H.GetCBuffers()) {
														
 
															-    auto b = make_unique<DxilCBuffer>();
														
 
															+    auto b = llvm::make_unique<DxilCBuffer>();
														
 
															     InitResourceBase(C.get(), b.get());
														
 
															     b->SetSize(C->GetSize());
														
 
															     LLVMUsed.emplace_back(cast<GlobalVariable>(b->GetGlobalSymbol()));
														
 
															     M.AddCBuffer(std::move(b));
														
 
															   }
														
 
															   for (auto && C : H.GetUAVs()) {
														
 
															-    auto b = make_unique<DxilResource>();
														
 
															+    auto b = llvm::make_unique<DxilResource>();
														
 
															     InitResource(C.get(), b.get());
														
 
															     LLVMUsed.emplace_back(cast<GlobalVariable>(b->GetGlobalSymbol()));
														
 
															     M.AddUAV(std::move(b));
														
 
															   }
														
 
															   for (auto && C : H.GetSRVs()) {
														
 
															-    auto b = make_unique<DxilResource>();
														
 
															+    auto b = llvm::make_unique<DxilResource>();
														
 
															     InitResource(C.get(), b.get());
														
 
															     LLVMUsed.emplace_back(cast<GlobalVariable>(b->GetGlobalSymbol()));
														
 
															     M.AddSRV(std::move(b));
														
 
															   }
														
 
															   for (auto && C : H.GetSamplers()) {
														
 
															-    auto b = make_unique<DxilSampler>();
														
 
															+    auto b = llvm::make_unique<DxilSampler>();
														
 
															     InitResourceBase(C.get(), b.get());
														
 
															     b->SetSamplerKind(C->GetSamplerKind());
														
 
															     LLVMUsed.emplace_back(cast<GlobalVariable>(b->GetGlobalSymbol()));
														
--- a/lib/HLSL/DxilLinker.cpp
+++ b/lib/HLSL/DxilLinker.cpp
@@ -727,7 +727,7 @@ DxilLinkJob::Link(std::pair<DxilFunctionLinkInfo *, DxilLib *> &entryLinkPair,
 
															     // Add signature.
														
 
															     DxilEntrySignature &entrySig = entryDM.GetDxilEntrySignature(entryFunc);
														
 
															     std::unique_ptr<DxilEntrySignature> newSig =
														
 
															-        std::make_unique<DxilEntrySignature>(entrySig);
														
 
															+        llvm::make_unique<DxilEntrySignature>(entrySig);
														
 
															     DM.ResetEntrySignature(newSig.release());
														
 
															   }
														
@@ -1017,7 +1017,7 @@ bool DxilLinkerImpl::RegisterLib(StringRef name,
 
															   pM->setModuleIdentifier(name);
														
 
															   std::unique_ptr<DxilLib> pLib =
														
 
															-      std::make_unique<DxilLib>(std::move(pM));
														
 
															+      llvm::make_unique<DxilLib>(std::move(pM));
														
 
															   m_LibMap[name] = std::move(pLib);
														
 
															   return true;
														
 
															 }
														
--- a/lib/HLSL/DxilMetadataHelper.cpp
+++ b/lib/HLSL/DxilMetadataHelper.cpp
@@ -58,6 +58,11 @@ const char DxilMDHelper::kDxilViewIdStateMDName[]                     = "dx.view
 
															 const char DxilMDHelper::kDxilFunctionPropertiesMDName[]              = "dx.func.props";
														
 
															 const char DxilMDHelper::kDxilEntrySignaturesMDName[]                 = "dx.func.signatures";
														
 
															+const char DxilMDHelper::kDxilSourceContentsMDName[]                  = "dx.source.contents";
														
 
															+const char DxilMDHelper::kDxilSourceDefinesMDName[]                   = "dx.source.defines";
														
 
															+const char DxilMDHelper::kDxilSourceMainFileNameMDName[]              = "dx.source.mainFileName";
														
 
															+const char DxilMDHelper::kDxilSourceArgsMDName[]                      = "dx.source.args";
														
 
															+
														
 
															 static std::array<const char *, 7> DxilMDNames = {
														
 
															   DxilMDHelper::kDxilVersionMDName,
														
 
															   DxilMDHelper::kDxilShaderModelMDName,
														
--- a/lib/HLSL/DxilModule.cpp
+++ b/lib/HLSL/DxilModule.cpp
@@ -44,7 +44,7 @@ public:
 
															     : DiagnosticInfo(DK_FirstPluginKind, DiagnosticSeverity::DS_Error),
														
 
															     m_message(str) { }
														
 
															-  __override void print(DiagnosticPrinter &DP) const {
														
 
															+  void print(DiagnosticPrinter &DP) const override {
														
 
															     DP << m_message;
														
 
															   }
														
 
															 };
														
@@ -59,10 +59,10 @@ namespace hlsl {
 
															 DxilModule::DxilModule(Module *pModule)
														
 
															 : m_Ctx(pModule->getContext())
														
 
															 , m_pModule(pModule)
														
 
															-, m_pOP(std::make_unique<OP>(pModule->getContext(), pModule))
														
 
															-, m_pTypeSystem(std::make_unique<DxilTypeSystem>(pModule))
														
 
															-, m_pViewIdState(std::make_unique<DxilViewIdState>(this))
														
 
															-, m_pMDHelper(std::make_unique<DxilMDHelper>(pModule, std::make_unique<DxilExtraPropertyHelper>(pModule)))
														
 
															+, m_pOP(llvm::make_unique<OP>(pModule->getContext(), pModule))
														
 
															+, m_pTypeSystem(llvm::make_unique<DxilTypeSystem>(pModule))
														
 
															+, m_pViewIdState(llvm::make_unique<DxilViewIdState>(this))
														
 
															+, m_pMDHelper(llvm::make_unique<DxilMDHelper>(pModule, llvm::make_unique<DxilExtraPropertyHelper>(pModule)))
														
 
															 , m_pDebugInfoFinder(nullptr)
														
 
															 , m_pEntryFunc(nullptr)
														
 
															 , m_EntryName("")
														
@@ -608,8 +608,8 @@ void DxilModule::LoadDxilSamplerFromMDNode(llvm::MDNode *MD, DxilSampler &S) {
 
															 template <typename TResource>
														
 
															 static void RemoveResources(std::vector<std::unique_ptr<TResource>> &vec,
														
 
															                     std::unordered_set<unsigned> &immResID) {
														
 
															-  for (std::vector<std::unique_ptr<TResource>>::iterator p = vec.begin(); p != vec.end();) {
														
 
															-    std::vector<std::unique_ptr<TResource>>::iterator c = p++;
														
 
															+  for (auto p = vec.begin(); p != vec.end();) {
														
 
															+    auto c = p++;
														
 
															     if (immResID.count((*c)->GetID()) == 0) {
														
 
															       p = vec.erase(c);
														
 
															     }
														
@@ -1409,10 +1409,27 @@ void DxilModule::StripDebugRelatedCode() {
 
															       }
														
 
															     }
														
 
															   }
														
 
															+  // Remove dx.source metadata.
														
 
															+  if (NamedMDNode *contents = m_pModule->getNamedMetadata(
														
 
															+          DxilMDHelper::kDxilSourceContentsMDName)) {
														
 
															+    contents->eraseFromParent();
														
 
															+  }
														
 
															+  if (NamedMDNode *defines =
														
 
															+          m_pModule->getNamedMetadata(DxilMDHelper::kDxilSourceDefinesMDName)) {
														
 
															+    defines->eraseFromParent();
														
 
															+  }
														
 
															+  if (NamedMDNode *mainFileName = m_pModule->getNamedMetadata(
														
 
															+          DxilMDHelper::kDxilSourceMainFileNameMDName)) {
														
 
															+    mainFileName->eraseFromParent();
														
 
															+  }
														
 
															+  if (NamedMDNode *arguments =
														
 
															+          m_pModule->getNamedMetadata(DxilMDHelper::kDxilSourceArgsMDName)) {
														
 
															+    arguments->eraseFromParent();
														
 
															+  }
														
 
															 }
														
 
															 DebugInfoFinder &DxilModule::GetOrCreateDebugInfoFinder() {
														
 
															   if (m_pDebugInfoFinder == nullptr) {
														
 
															-    m_pDebugInfoFinder = std::make_unique<llvm::DebugInfoFinder>();
														
 
															+    m_pDebugInfoFinder = llvm::make_unique<llvm::DebugInfoFinder>();
														
 
															     m_pDebugInfoFinder->processModule(*m_pModule);
														
 
															   }
														
 
															   return *m_pDebugInfoFinder;
														
@@ -1491,7 +1508,7 @@ namespace llvm {
 
															 hlsl::DxilModule &Module::GetOrCreateDxilModule(bool skipInit) {
														
 
															   std::unique_ptr<hlsl::DxilModule> M;
														
 
															   if (!HasDxilModule()) {
														
 
															-    M = std::make_unique<hlsl::DxilModule>(this);
														
 
															+    M = llvm::make_unique<hlsl::DxilModule>(this);
														
 
															     if (!skipInit) {
														
 
															       M->LoadDxilMetadata();
														
 
															     }
														
--- a/lib/HLSL/DxilResource.cpp
+++ b/lib/HLSL/DxilResource.cpp
@@ -203,12 +203,12 @@ unsigned DxilResource::GetNumOffsets(Kind ResourceKind) {
 
															       0, // Invalid = 0,
														
 
															       1, // Texture1D,
														
 
															       2, // Texture2D,
														
 
															-      0, // Texture2DMS,
														
 
															+      2, // Texture2DMS,
														
 
															       3, // Texture3D,
														
 
															       0, // TextureCube,
														
 
															       1, // Texture1DArray,
														
 
															       2, // Texture2DArray,
														
 
															-      0, // Texture2DMSArray,
														
 
															+      2, // Texture2DMSArray,
														
 
															       0, // TextureCubeArray,
														
 
															       0, // TypedBuffer,
														
 
															       0, // RawBuffer,
														
--- a/lib/HLSL/DxilValidation.cpp
+++ b/lib/HLSL/DxilValidation.cpp
@@ -11,7 +11,7 @@
 
															 #include "dxc/HLSL/DxilValidation.h"
														
 
															 #include "dxc/HLSL/DxilGenerationPass.h"
														
 
															-#include "dxc/HLSL/DXILOperations.h"
														
 
															+#include "dxc/HLSL/DxilOperations.h"
														
 
															 #include "dxc/HLSL/DxilModule.h"
														
 
															 #include "dxc/HLSL/DxilShaderModel.h"
														
 
															 #include "dxc/HLSL/DxilContainer.h"
														
@@ -282,7 +282,7 @@ public:
 
															     : DiagnosticInfo(DK_FirstPluginKind, DiagnosticSeverity::DS_Error),
														
 
															     m_message(str) { }
														
 
															-  __override void print(DiagnosticPrinter &DP) const {
														
 
															+  void print(DiagnosticPrinter &DP) const override {
														
 
															     DP << m_message;
														
 
															   }
														
 
															 };
														
@@ -3612,7 +3612,7 @@ static void ValidateSignature(ValidationContext &ValCtx, const DxilSignature &S,
 
															       {32, ValCtx.DxilMod.GetUseMinPrecision()},
														
 
															       {32, ValCtx.DxilMod.GetUseMinPrecision()},
														
 
															       {32, ValCtx.DxilMod.GetUseMinPrecision()}};
														
 
															-  unordered_set<Semantic::Kind> semanticUsageSet[DXIL::kNumOutputStreams];
														
 
															+  unordered_set<unsigned> semanticUsageSet[DXIL::kNumOutputStreams];
														
 
															   StringMap<unordered_set<unsigned>> semanticIndexMap[DXIL::kNumOutputStreams];
														
 
															   unordered_set<unsigned> clipcullRowSet[DXIL::kNumOutputStreams];
														
 
															   unsigned clipcullComponents[DXIL::kNumOutputStreams] = {0, 0, 0, 0};
														
@@ -3638,7 +3638,7 @@ static void ValidateSignature(ValidationContext &ValCtx, const DxilSignature &S,
 
															     // Semantic index overlap check, keyed by name.
														
 
															     std::string nameUpper(E->GetName());
														
 
															-    std::transform(nameUpper.begin(), nameUpper.end(), nameUpper.begin(), toupper);
														
 
															+    std::transform(nameUpper.begin(), nameUpper.end(), nameUpper.begin(), ::toupper);
														
 
															     unordered_set<unsigned> &semIdxSet = semanticIndexMap[streamId][nameUpper];
														
 
															     for (unsigned semIdx : E->GetSemanticIndexVec()) {
														
 
															       if (semIdxSet.count(semIdx) > 0) {
														
@@ -3711,11 +3711,11 @@ static void ValidateSignature(ValidationContext &ValCtx, const DxilSignature &S,
 
															       break;
														
 
															     }
														
 
															     default:
														
 
															-      if (semanticUsageSet[streamId].count(semanticKind) > 0) {
														
 
															+      if (semanticUsageSet[streamId].count(static_cast<unsigned>(semanticKind)) > 0) {
														
 
															         ValCtx.EmitFormatError(ValidationRule::MetaDuplicateSysValue,
														
 
															                                {E->GetSemantic()->GetName()});
														
 
															       }
														
 
															-      semanticUsageSet[streamId].insert(semanticKind);
														
 
															+      semanticUsageSet[streamId].insert(static_cast<unsigned>(semanticKind));
														
 
															       break;
														
 
															     }
														
--- a/lib/HLSL/HLOperationLower.cpp
+++ b/lib/HLSL/HLOperationLower.cpp
@@ -9,6 +9,10 @@
 
															 //                                                                           //
														
 
															 ///////////////////////////////////////////////////////////////////////////////
														
 
															+#define _USE_MATH_DEFINES
														
 
															+#include <cmath>
														
 
															+#include <unordered_set>
														
 
															+
														
 
															 #include "dxc/HLSL/DxilModule.h"
														
 
															 #include "dxc/HLSL/DxilOperations.h"
														
 
															 #include "dxc/HLSL/HLMatrixLowerHelper.h"
														
@@ -23,7 +27,6 @@
 
															 #include "llvm/IR/IRBuilder.h"
														
 
															 #include "llvm/IR/Instructions.h"
														
 
															 #include "llvm/IR/Module.h"
														
 
															-#include <unordered_set>
														
 
															 using namespace llvm;
														
 
															 using namespace hlsl;
														
@@ -1274,8 +1277,6 @@ Value *TranslateAtan2(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   Value *atan =
														
 
															       TrivialDxilUnaryOperation(OP::OpCode::Atan, tan, hlslOP, Builder);
														
 
															-  // TODO: include M_PI from math.h.
														
 
															-  const double M_PI = 3.14159265358979323846;
														
 
															   // Modify atan result based on https://en.wikipedia.org/wiki/Atan2.
														
 
															   Type *Ty = x->getType();
														
 
															   Constant *pi = ConstantFP::get(Ty->getScalarType(), M_PI);
														
@@ -1407,8 +1408,6 @@ Value *TranslateDegrees(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   Type *Ty = CI->getType();
														
 
															   Value *val = CI->getArgOperand(HLOperandIndex::kUnaryOpSrc0Idx);
														
 
															   // 180/pi.
														
 
															-  // TODO: include M_PI from math.h.
														
 
															-  const double M_PI = 3.14159265358979323846;
														
 
															   Constant *toDegreeConst = ConstantFP::get(Ty->getScalarType(), 180 / M_PI);
														
 
															   if (Ty != Ty->getScalarType()) {
														
 
															     toDegreeConst =
														
@@ -1518,8 +1517,6 @@ Value *TranslateRadians(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   Type *Ty = CI->getType();
														
 
															   Value *val = CI->getArgOperand(HLOperandIndex::kUnaryOpSrc0Idx);
														
 
															   // pi/180.
														
 
															-  // TODO: include M_PI from math.h.
														
 
															-  const double M_PI = 3.14159265358979323846;
														
 
															   Constant *toRadianConst = ConstantFP::get(Ty->getScalarType(), M_PI / 180);
														
 
															   if (Ty != Ty->getScalarType()) {
														
 
															     toRadianConst =
														
@@ -1620,8 +1617,6 @@ Value *TranslateExp(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   IRBuilder<> Builder(CI);
														
 
															   Type *Ty = CI->getType();
														
 
															   Value *val = CI->getArgOperand(HLOperandIndex::kUnaryOpSrc0Idx);
														
 
															-  // TODO: include M_LOG2E from math.h.
														
 
															-  const double M_LOG2E = 1.44269504088896340736;
														
 
															   Constant *log2eConst = ConstantFP::get(Ty->getScalarType(), M_LOG2E);
														
 
															   if (Ty != Ty->getScalarType()) {
														
 
															     log2eConst =
														
@@ -1638,8 +1633,6 @@ Value *TranslateLog(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   IRBuilder<> Builder(CI);
														
 
															   Type *Ty = CI->getType();
														
 
															   Value *val = CI->getArgOperand(HLOperandIndex::kUnaryOpSrc0Idx);
														
 
															-  // TODO: include M_LN2 from math.h.
														
 
															-  const double M_LN2 = 0.693147180559945309417;
														
 
															   Constant *ln2Const = ConstantFP::get(Ty->getScalarType(), M_LN2);
														
 
															   if (Ty != Ty->getScalarType()) {
														
 
															     ln2Const = ConstantVector::getSplat(Ty->getVectorNumElements(), ln2Const);
														
@@ -1655,9 +1648,6 @@ Value *TranslateLog10(CallInst *CI, IntrinsicOp IOP, OP::OpCode opcode,
 
															   IRBuilder<> Builder(CI);
														
 
															   Type *Ty = CI->getType();
														
 
															   Value *val = CI->getArgOperand(HLOperandIndex::kUnaryOpSrc0Idx);
														
 
															-  // TODO: include M_LN2 from math.h.
														
 
															-  const double M_LN2 = 0.693147180559945309417;
														
 
															-  const double M_LN10 = 2.30258509299404568402;
														
 
															   Constant *log2_10Const = ConstantFP::get(Ty->getScalarType(), M_LN2 / M_LN10);
														
 
															   if (Ty != Ty->getScalarType()) {
														
 
															     log2_10Const =
														
--- a/lib/HLSL/LLVMBuild.txt
+++ b/lib/HLSL/LLVMBuild.txt
@@ -13,4 +13,4 @@
 
															 type = Library
														
 
															 name = HLSL
														
 
															 parent = Libraries
														
 
															-required_libraries = Core Support
														
 
															+required_libraries = BitReader Core DxcSupport IPA Support
														
--- a/lib/IR/DiagnosticPrinter.cpp
+++ b/lib/IR/DiagnosticPrinter.cpp
@@ -96,6 +96,14 @@ DiagnosticPrinter &DiagnosticPrinterRawOStream::operator<<(const Twine &Str) {
 
															   return *this;
														
 
															 }
														
 
															+// HLSL Change Starts
														
 
															+DiagnosticPrinter &DiagnosticPrinterRawOStream::
														
 
															+operator<<(std::ios_base &(*iomanip)(std::ios_base &)) {
														
 
															+  Stream << iomanip;
														
 
															+  return *this;
														
 
															+}
														
 
															+// HLSL Change Ends.
														
 
															+
														
 
															 // IR related types.
														
 
															 DiagnosticPrinter &DiagnosticPrinterRawOStream::operator<<(const Value &V) {
														
 
															   Stream << V.getName();
														
--- a/lib/LLVMBuild.txt
+++ b/lib/LLVMBuild.txt
@@ -22,6 +22,7 @@ subdirectories =
 
															  Bitcode
														
 
															  CodeGen
														
 
															  DebugInfo
														
 
															+ DxcSupport
														
 
															  ExecutionEngine
														
 
															  Linker
														
 
															  IR
														
--- a/lib/MSSupport/MSFileSystemImpl.cpp
+++ b/lib/MSSupport/MSFileSystemImpl.cpp
@@ -90,96 +90,96 @@ MSFileSystemForDisk::MSFileSystemForDisk()
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::FindNextFileW(HANDLE hFindFile, LPWIN32_FIND_DATAW lpFindFileData)
														
 
															+BOOL MSFileSystemForDisk::FindNextFileW(HANDLE hFindFile, LPWIN32_FIND_DATAW lpFindFileData) throw()
														
 
															 {
														
 
															   return ::FindNextFileW(hFindFile, lpFindFileData);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-HANDLE MSFileSystemForDisk::FindFirstFileW(LPCWSTR lpFileName, LPWIN32_FIND_DATAW lpFindFileData)
														
 
															+HANDLE MSFileSystemForDisk::FindFirstFileW(LPCWSTR lpFileName, LPWIN32_FIND_DATAW lpFindFileData) throw()
														
 
															 {
														
 
															   return ::FindFirstFileW(lpFileName, lpFindFileData);
														
 
															 }
														
 
															-void MSFileSystemForDisk::FindClose(HANDLE findHandle)
														
 
															+void MSFileSystemForDisk::FindClose(HANDLE findHandle) throw()
														
 
															 {
														
 
															   ::FindClose(findHandle);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-HANDLE MSFileSystemForDisk::CreateFileW(LPCWSTR lpFileName, DWORD dwDesiredAccess, DWORD dwShareMode, DWORD dwCreationDisposition, DWORD dwFlagsAndAttributes)
														
 
															+HANDLE MSFileSystemForDisk::CreateFileW(LPCWSTR lpFileName, DWORD dwDesiredAccess, DWORD dwShareMode, DWORD dwCreationDisposition, DWORD dwFlagsAndAttributes) throw()
														
 
															 {
														
 
															   return ::CreateFileW(lpFileName, dwDesiredAccess, dwShareMode, nullptr, dwCreationDisposition, dwFlagsAndAttributes, nullptr);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::SetFileTime(HANDLE hFile, _In_opt_ const FILETIME *lpCreationTime, _In_opt_ const FILETIME *lpLastAccessTime, _In_opt_ const FILETIME *lpLastWriteTime)
														
 
															+BOOL MSFileSystemForDisk::SetFileTime(HANDLE hFile, _In_opt_ const FILETIME *lpCreationTime, _In_opt_ const FILETIME *lpLastAccessTime, _In_opt_ const FILETIME *lpLastWriteTime) throw()
														
 
															 {
														
 
															   return ::SetFileTime(hFile, lpCreationTime, lpLastAccessTime, lpLastWriteTime);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::GetFileInformationByHandle(HANDLE hFile, LPBY_HANDLE_FILE_INFORMATION lpFileInformation)
														
 
															+BOOL MSFileSystemForDisk::GetFileInformationByHandle(HANDLE hFile, LPBY_HANDLE_FILE_INFORMATION lpFileInformation) throw()
														
 
															 {
														
 
															   return ::GetFileInformationByHandle(hFile, lpFileInformation);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-DWORD MSFileSystemForDisk::GetFileType(HANDLE hFile)
														
 
															+DWORD MSFileSystemForDisk::GetFileType(HANDLE hFile) throw()
														
 
															 {
														
 
															   return ::GetFileType(hFile);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::CreateHardLinkW(LPCWSTR lpFileName, LPCWSTR lpExistingFileName)
														
 
															+BOOL MSFileSystemForDisk::CreateHardLinkW(LPCWSTR lpFileName, LPCWSTR lpExistingFileName) throw()
														
 
															 {
														
 
															   return ::CreateHardLinkW(lpFileName, lpExistingFileName, nullptr);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::MoveFileExW(LPCWSTR lpExistingFileName, LPCWSTR lpNewFileName, DWORD dwFlags)
														
 
															+BOOL MSFileSystemForDisk::MoveFileExW(LPCWSTR lpExistingFileName, LPCWSTR lpNewFileName, DWORD dwFlags) throw()
														
 
															 {
														
 
															   return ::MoveFileExW(lpExistingFileName, lpNewFileName, dwFlags);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-DWORD MSFileSystemForDisk::GetFileAttributesW(LPCWSTR lpFileName)
														
 
															+DWORD MSFileSystemForDisk::GetFileAttributesW(LPCWSTR lpFileName) throw()
														
 
															 {
														
 
															   return ::GetFileAttributesW(lpFileName);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::CloseHandle(HANDLE hObject)
														
 
															+BOOL MSFileSystemForDisk::CloseHandle(HANDLE hObject) throw()
														
 
															 {
														
 
															   return ::CloseHandle(hObject);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::DeleteFileW(LPCWSTR lpFileName)
														
 
															+BOOL MSFileSystemForDisk::DeleteFileW(LPCWSTR lpFileName) throw()
														
 
															 {
														
 
															   return ::DeleteFileW(lpFileName);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::RemoveDirectoryW(LPCWSTR lpFileName)
														
 
															+BOOL MSFileSystemForDisk::RemoveDirectoryW(LPCWSTR lpFileName) throw()
														
 
															 {
														
 
															   return ::RemoveDirectoryW(lpFileName);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::CreateDirectoryW(LPCWSTR lpPathName)
														
 
															+BOOL MSFileSystemForDisk::CreateDirectoryW(LPCWSTR lpPathName) throw()
														
 
															 {
														
 
															   return ::CreateDirectoryW(lpPathName, nullptr);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-DWORD MSFileSystemForDisk::GetCurrentDirectoryW(DWORD nBufferLength,  LPWSTR lpBuffer)
														
 
															+DWORD MSFileSystemForDisk::GetCurrentDirectoryW(DWORD nBufferLength,  LPWSTR lpBuffer) throw()
														
 
															 {
														
 
															   return ::GetCurrentDirectoryW(nBufferLength, lpBuffer);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-DWORD MSFileSystemForDisk::GetMainModuleFileNameW(LPWSTR lpFilename, DWORD nSize)
														
 
															+DWORD MSFileSystemForDisk::GetMainModuleFileNameW(LPWSTR lpFilename, DWORD nSize) throw()
														
 
															 {
														
 
															   // Add some code to ensure that the result is null terminated.
														
 
															   if (nSize <= 1)
														
@@ -195,7 +195,7 @@ DWORD MSFileSystemForDisk::GetMainModuleFileNameW(LPWSTR lpFilename, DWORD nSize
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-DWORD MSFileSystemForDisk::GetTempPathW(DWORD nBufferLength, LPWSTR lpBuffer)
														
 
															+DWORD MSFileSystemForDisk::GetTempPathW(DWORD nBufferLength, LPWSTR lpBuffer) throw()
														
 
															 {
														
 
															   return ::GetTempPathW(nBufferLength, lpBuffer);
														
 
															 }
														
@@ -212,30 +212,30 @@ namespace {
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOLEAN MSFileSystemForDisk::CreateSymbolicLinkW(LPCWSTR lpSymlinkFileName, LPCWSTR lpTargetFileName, DWORD dwFlags)
														
 
															+BOOLEAN MSFileSystemForDisk::CreateSymbolicLinkW(LPCWSTR lpSymlinkFileName, LPCWSTR lpTargetFileName, DWORD dwFlags) throw()
														
 
															 {
														
 
															   return create_symbolic_link_api(lpSymlinkFileName, lpTargetFileName, dwFlags);
														
 
															 }
														
 
															-bool MSFileSystemForDisk::SupportsCreateSymbolicLink()
														
 
															+bool MSFileSystemForDisk::SupportsCreateSymbolicLink() throw()
														
 
															 {
														
 
															   return create_symbolic_link_api != nullptr;
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-BOOL MSFileSystemForDisk::ReadFile(HANDLE hFile, LPVOID lpBuffer, DWORD nNumberOfBytesToRead, _Out_opt_ LPDWORD lpNumberOfBytesRead)
														
 
															+BOOL MSFileSystemForDisk::ReadFile(HANDLE hFile, LPVOID lpBuffer, DWORD nNumberOfBytesToRead, _Out_opt_ LPDWORD lpNumberOfBytesRead) throw()
														
 
															 {
														
 
															   return ::ReadFile(hFile, lpBuffer, nNumberOfBytesToRead, lpNumberOfBytesRead, nullptr);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-HANDLE MSFileSystemForDisk::CreateFileMappingW(HANDLE hFile, DWORD flProtect, DWORD dwMaximumSizeHigh, DWORD dwMaximumSizeLow)
														
 
															+HANDLE MSFileSystemForDisk::CreateFileMappingW(HANDLE hFile, DWORD flProtect, DWORD dwMaximumSizeHigh, DWORD dwMaximumSizeLow) throw()
														
 
															 {
														
 
															   return ::CreateFileMappingW(hFile, nullptr, flProtect, dwMaximumSizeHigh, dwMaximumSizeLow, nullptr);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-LPVOID MSFileSystemForDisk::MapViewOfFile(HANDLE hFileMappingObject, DWORD dwDesiredAccess, DWORD dwFileOffsetHigh, DWORD dwFileOffsetLow, SIZE_T dwNumberOfBytesToMap)
														
 
															+LPVOID MSFileSystemForDisk::MapViewOfFile(HANDLE hFileMappingObject, DWORD dwDesiredAccess, DWORD dwFileOffsetHigh, DWORD dwFileOffsetLow, SIZE_T dwNumberOfBytesToMap) throw()
														
 
															 {
														
 
															   return ::MapViewOfFile(hFileMappingObject, dwDesiredAccess, dwFileOffsetHigh, dwFileOffsetLow, dwNumberOfBytesToMap);
														
 
															 }
														
@@ -246,13 +246,13 @@ BOOL MSFileSystemForDisk::UnmapViewOfFile(LPCVOID lpBaseAddress) throw()
 
															   return ::UnmapViewOfFile(lpBaseAddress);
														
 
															 }
														
 
															-bool MSFileSystemForDisk::FileDescriptorIsDisplayed(int fd)
														
 
															+bool MSFileSystemForDisk::FileDescriptorIsDisplayed(int fd) throw()
														
 
															 {
														
 
															   DWORD Mode;  // Unused
														
 
															   return (GetConsoleMode((HANDLE)_get_osfhandle(fd), &Mode) != 0);
														
 
															 }
														
 
															-unsigned MSFileSystemForDisk::GetColumnCount(DWORD nStdHandle)
														
 
															+unsigned MSFileSystemForDisk::GetColumnCount(DWORD nStdHandle) throw()
														
 
															 {
														
 
															   unsigned Columns = 0;
														
 
															   CONSOLE_SCREEN_BUFFER_INFO csbi;
														
@@ -269,43 +269,43 @@ unsigned MSFileSystemForDisk::GetConsoleOutputTextAttributes() throw()
 
															   return 0;
														
 
															 }
														
 
															-void MSFileSystemForDisk::SetConsoleOutputTextAttributes(unsigned attributes)
														
 
															+void MSFileSystemForDisk::SetConsoleOutputTextAttributes(unsigned attributes) throw()
														
 
															 {
														
 
															   ::SetConsoleTextAttribute(GetStdHandle(STD_OUTPUT_HANDLE), attributes);
														
 
															 }
														
 
															-void MSFileSystemForDisk::ResetConsoleOutputTextAttributes()
														
 
															+void MSFileSystemForDisk::ResetConsoleOutputTextAttributes() throw()
														
 
															 {
														
 
															   ::SetConsoleTextAttribute(GetStdHandle(STD_OUTPUT_HANDLE), _defaultAttributes);
														
 
															 }
														
 
															-int MSFileSystemForDisk::open_osfhandle(intptr_t osfhandle, int flags)
														
 
															+int MSFileSystemForDisk::open_osfhandle(intptr_t osfhandle, int flags) throw()
														
 
															 {
														
 
															   return ::_open_osfhandle(osfhandle, flags);
														
 
															 }
														
 
															-intptr_t MSFileSystemForDisk::get_osfhandle(int fd)
														
 
															+intptr_t MSFileSystemForDisk::get_osfhandle(int fd) throw()
														
 
															 {
														
 
															   return ::_get_osfhandle(fd);
														
 
															 }
														
 
															-int MSFileSystemForDisk::close(int fd)
														
 
															+int MSFileSystemForDisk::close(int fd) throw()
														
 
															 {
														
 
															   return ::_close(fd);
														
 
															 }
														
 
															-long MSFileSystemForDisk::lseek(int fd, long offset, int origin)
														
 
															+long MSFileSystemForDisk::lseek(int fd, long offset, int origin) throw()
														
 
															 {
														
 
															   return ::_lseek(fd, offset, origin);
														
 
															 }
														
 
															-int MSFileSystemForDisk::setmode(int fd, int mode)
														
 
															+int MSFileSystemForDisk::setmode(int fd, int mode) throw()
														
 
															 {
														
 
															   return ::_setmode(fd, mode);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-errno_t MSFileSystemForDisk::resize_file(LPCWSTR path, uint64_t size)
														
 
															+errno_t MSFileSystemForDisk::resize_file(LPCWSTR path, uint64_t size) throw()
														
 
															 {
														
 
															   int fd = ::_wopen(path, O_BINARY | _O_RDWR, S_IWRITE);
														
 
															   if (fd == -1)
														
@@ -320,13 +320,13 @@ errno_t MSFileSystemForDisk::resize_file(LPCWSTR path, uint64_t size)
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-int MSFileSystemForDisk::Read(int fd, void* buffer, unsigned int count)
														
 
															+int MSFileSystemForDisk::Read(int fd, void* buffer, unsigned int count) throw()
														
 
															 {
														
 
															   return ::_read(fd, buffer, count);
														
 
															 }
														
 
															 _Use_decl_annotations_
														
 
															-int MSFileSystemForDisk::Write(int fd, const void* buffer, unsigned int count)
														
 
															+int MSFileSystemForDisk::Write(int fd, const void* buffer, unsigned int count) throw()
														
 
															 {
														
 
															   return ::_write(fd, buffer, count);
														
 
															 }
														
@@ -338,7 +338,7 @@ int MSFileSystemForDisk::Write(int fd, const void* buffer, unsigned int count)
 
															 ///////////////////////////////////////////////////////////////////////////////////////////////////
														
 
															 // Externally visible functions.
														
 
															-HRESULT CreateMSFileSystemForDisk(_COM_Outptr_ ::llvm::sys::fs::MSFileSystem** pResult)
														
 
															+HRESULT CreateMSFileSystemForDisk(_COM_Outptr_ ::llvm::sys::fs::MSFileSystem** pResult) throw()
														
 
															 {
														
 
															   *pResult = new (std::nothrow) ::llvm::sys::fs::MSFileSystemForDisk();
														
 
															   return (*pResult != nullptr) ? S_OK : E_OUTOFMEMORY;
														
--- a/lib/Support/Debug.cpp
+++ b/lib/Support/Debug.cpp
@@ -80,8 +80,8 @@ namespace llvm {
 
															       ods_ostream() {
														
 
															         SetUnbuffered();
														
 
															       }
														
 
															-      __override uint64_t current_pos() const { return 0; }
														
 
															-      __override void write_impl(const char *Ptr, size_t Size) {
														
 
															+      uint64_t current_pos() const override { return 0; }
														
 
															+      void write_impl(const char *Ptr, size_t Size) override {
														
 
															         // Need a null-terminated string here.
														
 
															         char chunk[512];
														
 
															         while (Size > 0) {
														
--- a/lib/Support/raw_ostream.cpp
+++ b/lib/Support/raw_ostream.cpp
@@ -25,6 +25,7 @@
 
															 #include "llvm/Support/Program.h"
														
 
															 #include <cctype>
														
 
															 #include <cerrno>
														
 
															+#include <ios>
														
 
															 #include <sys/stat.h>
														
 
															 #include <system_error>
														
@@ -106,6 +107,16 @@ void raw_ostream::SetBufferAndMode(_In_opt_ char *BufferStart, size_t Size,
 
															 }
														
 
															 raw_ostream &raw_ostream::operator<<(unsigned long N) {
														
 
															+
														
 
															+  // HLSL Change Starts - Handle non-base10 printing
														
 
															+  if (writeBase != 10) {
														
 
															+    *this << '0';
														
 
															+    if (writeBase == 16)
														
 
															+      *this << 'x';
														
 
															+    return write_base((unsigned long long)N);
														
 
															+  }
														
 
															+  // HLSL Change Ends
														
 
															+
														
 
															   // Zero is a special case.
														
 
															   if (N == 0)
														
 
															     return *this << '0';
														
@@ -122,7 +133,7 @@ raw_ostream &raw_ostream::operator<<(unsigned long N) {
 
															 }
														
 
															 raw_ostream &raw_ostream::operator<<(long N) {
														
 
															-  if (N <  0) {
														
 
															+  if (N < 0 && writeBase == 10) {
														
 
															     *this << '-';
														
 
															     // Avoid undefined behavior on LONG_MIN with a cast.
														
 
															     N = -(unsigned long)N;
														
@@ -136,6 +147,15 @@ raw_ostream &raw_ostream::operator<<(unsigned long long N) {
 
															   if (N == static_cast<unsigned long>(N))
														
 
															     return this->operator<<(static_cast<unsigned long>(N));
														
 
															+  // HLSL Change Starts - Handle non-base10 printing
														
 
															+  if (writeBase != 10) {
														
 
															+    *this << '0';
														
 
															+    if (writeBase == 16)
														
 
															+      *this << 'x';
														
 
															+    return write_base((unsigned long long)N);
														
 
															+  }
														
 
															+  // HLSL Change Ends
														
 
															+
														
 
															   char NumberBuffer[20];
														
 
															   char *EndPtr = NumberBuffer+sizeof(NumberBuffer);
														
 
															   char *CurPtr = EndPtr;
														
@@ -148,7 +168,7 @@ raw_ostream &raw_ostream::operator<<(unsigned long long N) {
 
															 }
														
 
															 raw_ostream &raw_ostream::operator<<(long long N) {
														
 
															-  if (N < 0) {
														
 
															+  if (N < 0 && writeBase == 10) {
														
 
															     *this << '-';
														
 
															     // Avoid undefined behavior on INT64_MIN with a cast.
														
 
															     N = -(unsigned long long)N;
														
@@ -157,23 +177,33 @@ raw_ostream &raw_ostream::operator<<(long long N) {
 
															   return this->operator<<(static_cast<unsigned long long>(N));
														
 
															 }
														
 
															+// HLSL Change Starts - Generalize non-base10 printing.
														
 
															 raw_ostream &raw_ostream::write_hex(unsigned long long N) {
														
 
															+  int oldBase = writeBase;
														
 
															+  writeBase = 16;
														
 
															+  raw_ostream &rv = write_base(N);
														
 
															+  writeBase = oldBase;
														
 
															+  return rv;
														
 
															+}
														
 
															+
														
 
															+raw_ostream &raw_ostream::write_base(unsigned long long N) {
														
 
															   // Zero is a special case.
														
 
															   if (N == 0)
														
 
															     return *this << '0';
														
 
															   char NumberBuffer[20];
														
 
															-  char *EndPtr = NumberBuffer+sizeof(NumberBuffer);
														
 
															+  char *EndPtr = NumberBuffer + sizeof(NumberBuffer);
														
 
															   char *CurPtr = EndPtr;
														
 
															   while (N) {
														
 
															-    uintptr_t x = N % 16;
														
 
															+    uintptr_t x = N % writeBase;
														
 
															     *--CurPtr = (x < 10 ? '0' + x : 'a' + x - 10);
														
 
															-    N /= 16;
														
 
															+    N /= writeBase;
														
 
															   }
														
 
															-  return write(CurPtr, EndPtr-CurPtr);
														
 
															+  return write(CurPtr, EndPtr - CurPtr);
														
 
															 }
														
 
															+// HLSL Change Ends
														
 
															 raw_ostream &raw_ostream::write_escaped(StringRef Str,
														
 
															                                         bool UseHexEscapes) {
														
@@ -456,6 +486,19 @@ raw_ostream &raw_ostream::operator<<(const FormattedNumber &FN) {
 
															   }
														
 
															 }
														
 
															+// HLSL Change Starts - Add handling of numerical base IO manipulators.
														
 
															+raw_ostream &raw_ostream::
														
 
															+operator<<(std::ios_base &(*iomanip)(std::ios_base &)) {
														
 
															+  if (iomanip == std::hex)
														
 
															+    writeBase = 16;
														
 
															+  else if (iomanip == std::oct)
														
 
															+    writeBase = 8;
														
 
															+  else
														
 
															+    writeBase = 10;
														
 
															+
														
 
															+  return *this;
														
 
															+}
														
 
															+// HLSL Change Ends
														
 
															 /// indent - Insert 'NumSpaces' spaces.
														
 
															 raw_ostream &raw_ostream::indent(unsigned NumSpaces) {
														
--- a/lib/Transforms/IPO/GlobalDCE.cpp
+++ b/lib/Transforms/IPO/GlobalDCE.cpp
@@ -27,7 +27,7 @@
 
															 #include <unordered_map>
														
 
															 #include "dxc/HLSL/HLModule.h" // HLSL Change
														
 
															 #include "dxc/HLSL/DxilModule.h" // HLSL Change
														
 
															-#include "dxc/HLSL/DXILOperations.h" // HLSL Change
														
 
															+#include "dxc/HLSL/DxilOperations.h" // HLSL Change
														
 
															 #include "dxc/HLSL/DxilInstructions.h" // HLSL Change
														
 
															 using namespace llvm;
														
--- a/lib/Transforms/IPO/Inliner.cpp
+++ b/lib/Transforms/IPO/Inliner.cpp
@@ -83,7 +83,7 @@ Inliner::Inliner(char &ID)
 
															 Inliner::Inliner(char &ID, int Threshold, bool InsertLifetime)
														
 
															   : CallGraphSCCPass(ID), InlineThreshold(InlineLimit.getNumOccurrences() > 0 ?
														
 
															-                                          InlineLimit : Threshold),
														
 
															+                                          unsigned(InlineLimit) : Threshold),
														
 
															     InsertLifetime(InsertLifetime) {}
														
 
															 /// For this class, we declare that we require and preserve the call graph.
														
--- a/lib/Transforms/Scalar/LoopUnrollPass.cpp
+++ b/lib/Transforms/Scalar/LoopUnrollPass.cpp
@@ -101,13 +101,13 @@ namespace {
 
															   public:
														
 
															     static char ID; // Pass ID, replacement for typeid
														
 
															     LoopUnroll(int T = -1, int C = -1, int P = -1, int R = -1) : LoopPass(ID) {
														
 
															-      CurrentThreshold = (T == -1) ? UnrollThreshold : unsigned(T);
														
 
															+      CurrentThreshold = (T == -1) ? unsigned(UnrollThreshold) : unsigned(T);
														
 
															       CurrentPercentDynamicCostSavedThreshold =
														
 
															           UnrollPercentDynamicCostSavedThreshold;
														
 
															       CurrentDynamicCostSavingsDiscount = UnrollDynamicCostSavingsDiscount;
														
 
															-      CurrentCount = (C == -1) ? UnrollCount : unsigned(C);
														
 
															-      CurrentAllowPartial = (P == -1) ? UnrollAllowPartial : (bool)P;
														
 
															-      CurrentRuntime = (R == -1) ? UnrollRuntime : (bool)R;
														
 
															+      CurrentCount = (C == -1) ? unsigned(UnrollCount) : unsigned(C);
														
 
															+      CurrentAllowPartial = (P == -1) ? (bool)UnrollAllowPartial : (bool)P;
														
 
															+      CurrentRuntime = (R == -1) ? (bool)UnrollRuntime : (bool)R;
														
 
															       UserThreshold = (T != -1) || (UnrollThreshold.getNumOccurrences() > 0);
														
 
															       UserPercentDynamicCostSavedThreshold =
														
--- a/lib/Transforms/Scalar/ScalarReplAggregatesHLSL.cpp
+++ b/lib/Transforms/Scalar/ScalarReplAggregatesHLSL.cpp
@@ -3873,6 +3873,9 @@ static void ReplaceConstantWithInst(Constant *C, Value *V, IRBuilder<> &Builder)
 
															     if (Instruction *I = dyn_cast<Instruction>(U)) {
														
 
															       I->replaceUsesOfWith(C, V);
														
 
															     } else {
														
 
															+      // Skip unused ConstantExpr.
														
 
															+      if (U->user_empty())
														
 
															+        continue;
														
 
															       ConstantExpr *CE = cast<ConstantExpr>(U);
														
 
															       Instruction *Inst = CE->getAsInstruction();
														
 
															       Builder.Insert(Inst);
														
@@ -3880,6 +3883,7 @@ static void ReplaceConstantWithInst(Constant *C, Value *V, IRBuilder<> &Builder)
 
															       ReplaceConstantWithInst(CE, Inst, Builder);
														
 
															     }
														
 
															   }
														
 
															+  C->removeDeadConstantUsers();
														
 
															 }
														
 
															 static void ReplaceUnboundedArrayUses(Value *V, Value *Src, IRBuilder<> &Builder) {
														
@@ -6118,7 +6122,7 @@ void SROA_Parameter_HLSL::createFlattenedFunction(Function *F) {
 
															   // ShaderProps.
														
 
															   if (m_pHLModule->HasDxilFunctionProps(F)) {
														
 
															     DxilFunctionProps &funcProps = m_pHLModule->GetDxilFunctionProps(F);
														
 
															-    std::unique_ptr<DxilFunctionProps> flatFuncProps = std::make_unique<DxilFunctionProps>();
														
 
															+    std::unique_ptr<DxilFunctionProps> flatFuncProps = llvm::make_unique<DxilFunctionProps>();
														
 
															     flatFuncProps->shaderKind = funcProps.shaderKind;
														
 
															     flatFuncProps->ShaderProps = funcProps.ShaderProps;
														
 
															     m_pHLModule->AddDxilFunctionProps(flatF, flatFuncProps);
														
--- a/tools/clang/include/clang/AST/HlslTypes.h
+++ b/tools/clang/include/clang/AST/HlslTypes.h
@@ -117,15 +117,15 @@ struct MatrixMemberAccessPositions {
 
															     default:
														
 
															     case 3: *row = R3_Row; *col = R3_Col; break;
														
 
															     }
														
 
															-    assert(0 <= *row && *row <= 3);
														
 
															-    assert(0 <= *col && *col <= 3);
														
 
															+    assert(*row <= 3);
														
 
															+    assert(*col <= 3);
														
 
															   }
														
 
															   void SetPosition(uint32_t index, uint32_t row, uint32_t col)
														
 
															   {
														
 
															     assert(index < 4);
														
 
															-    assert(0 <= row && row <= 3);
														
 
															-    assert(0 <= col && col <= 3);
														
 
															+    assert(row <= 3);
														
 
															+    assert(col <= 3);
														
 
															     switch (index)
														
 
															     {
														
 
															     case 0: R0_Row = row; R0_Col = col; break;
														
@@ -168,13 +168,13 @@ struct VectorMemberAccessPositions {
 
															     default:
														
 
															     case 3: *col = Swz3; break;
														
 
															     }
														
 
															-    assert(0 <= *col && *col <= 3);
														
 
															+    assert(*col <= 3);
														
 
															   }
														
 
															   void SetPosition(uint32_t index, uint32_t col)
														
 
															   {
														
 
															     assert(index < 4);
														
 
															-    assert(0 <= col && col <= 3);
														
 
															+    assert(col <= 3);
														
 
															     switch (index)
														
 
															     {
														
 
															     case 0: Swz0 = col; break;
														
--- a/tools/clang/include/clang/AST/Type.h
+++ b/tools/clang/include/clang/AST/Type.h
@@ -3298,7 +3298,7 @@ public:
 
															   }
														
 
															   const hlsl::ParameterModifier *parammods_begin() const {
														
 
															     // param modifiers begin where exceptions end
														
 
															-    return (hlsl::ParameterModifier*)exception_end();
														
 
															+    return (const hlsl::ParameterModifier*)exception_end();
														
 
															   }
														
 
															   const hlsl::ParameterModifier *parammods_end() const {
														
 
															     // modifiers begin where arguments end (in place of exceptions, in HLSL)
														
--- a/tools/clang/include/clang/Basic/Attr.td
+++ b/tools/clang/include/clang/Basic/Attr.td
@@ -879,6 +879,14 @@ def VKLocation : InheritableAttr {
 
															   let Documentation = [Undocumented];
														
 
															 }
														
 
															+def VKIndex : InheritableAttr {
														
 
															+  let Spellings = [CXX11<"vk", "index">];
														
 
															+  let Subjects = SubjectList<[Function, ParmVar, Field], ErrorDiag>;
														
 
															+  let Args = [IntArgument<"Number">];
														
 
															+  let LangOpts = [SPIRV];
														
 
															+  let Documentation = [Undocumented];
														
 
															+}
														
 
															+
														
 
															 def VKBinding : InheritableAttr {
														
 
															   let Spellings = [CXX11<"vk", "binding">];
														
 
															   let Subjects = SubjectList<[GlobalVar, HLSLBuffer], ErrorDiag, "ExpectedGlobalVarOrCTBuffer">;
														
--- a/tools/clang/include/clang/Basic/DiagnosticSemaKinds.td
+++ b/tools/clang/include/clang/Basic/DiagnosticSemaKinds.td
@@ -2334,7 +2334,7 @@ def warn_attribute_wrong_decl_type : Warning<
 
															   "SubpassInput, SubpassInputMS|"
														
 
															   // SPIRV Change Ends
														
 
															   // HLSL Change Starts - add 3 more enum values
														
 
															-  "varibales and parameters|functions, parameters, and fields|"
														
 
															+  "variables and parameters|functions, parameters, and fields|"
														
 
															   "functions, variables, parameters, fields, and types}1">,
														
 
															   // HLSL Change Ends
														
 
															   InGroup<IgnoredAttributes>;
														
@@ -7518,6 +7518,8 @@ def err_hlsl_unsupported_array_equality_op: Error<
 
															   "equality operators cannot be used with array types">;
														
 
															 def err_hlsl_unsupported_array_size: Error<
														
 
															   "array dimension must be between 1 and 65536">;
														
 
															+def err_hlsl_unsupported_incomplete_array: Error<
														
 
															+  "array dimensions of struct/class members must be explicit">;
														
 
															 def err_hlsl_unsupported_bool_lvalue_op : Error<
														
 
															   "operator cannot be used with a bool lvalue">;
														
 
															 def err_hlsl_unsupported_lvalue_cast_op : Error<
														
--- a/tools/clang/include/clang/SPIRV/Decoration.h
+++ b/tools/clang/include/clang/SPIRV/Decoration.h
@@ -126,6 +126,7 @@ public:
 
															   static const Decoration *getInputAttachmentIndex(SPIRVContext &ctx,
														
 
															                                                    uint32_t index);
														
 
															   static const Decoration *getAlignment(SPIRVContext &ctx, uint32_t alignment);
														
 
															+  static const Decoration *getNonUniformEXT(SPIRVContext &ctx);
														
 
															   static const Decoration *getOverrideCoverageNV(SPIRVContext &ctx);
														
 
															   static const Decoration *getPassthroughNV(SPIRVContext &ctx);
														
 
															   static const Decoration *getViewportRelativeNV(SPIRVContext &ctx);
														
--- a/tools/clang/include/clang/SPIRV/EmitSPIRVOptions.h
+++ b/tools/clang/include/clang/SPIRV/EmitSPIRVOptions.h
@@ -35,10 +35,10 @@ struct EmitSPIRVOptions {
 
															   bool invertY;
														
 
															   bool useGlLayout;
														
 
															   bool useDxLayout;
														
 
															-  bool ignoreUnusedResources;
														
 
															   bool enable16BitTypes;
														
 
															   bool enableReflect;
														
 
															   bool enableDebugInfo;
														
 
															+  bool noWarnIgnoredFeatures;
														
 
															   llvm::StringRef stageIoOrder;
														
 
															   llvm::SmallVector<int32_t, 4> bShift;
														
 
															   llvm::SmallVector<int32_t, 4> tShift;
														
--- a/tools/clang/include/clang/SPIRV/FeatureManager.h
+++ b/tools/clang/include/clang/SPIRV/FeatureManager.h
@@ -34,8 +34,10 @@ enum class Extension {
 
															   KHR_device_group,
														
 
															   KHR_multiview,
														
 
															   KHR_shader_draw_parameters,
														
 
															+  EXT_descriptor_indexing,
														
 
															   EXT_fragment_fully_covered,
														
 
															   EXT_shader_stencil_export,
														
 
															+  EXT_shader_viewport_index_layer,
														
 
															   AMD_gpu_shader_half_float,
														
 
															   AMD_shader_explicit_vertex_parameter,
														
 
															   GOOGLE_hlsl_functionality1,
														
--- a/tools/clang/include/clang/SPIRV/ModuleBuilder.h
+++ b/tools/clang/include/clang/SPIRV/ModuleBuilder.h
@@ -199,10 +199,13 @@ public:
 
															   /// If residencyCodeId is not zero, the sparse version of the instructions
														
 
															   /// will be used, and the SPIR-V instruction for storing the resulting
														
 
															   /// residency code will also be emitted.
														
 
															+  ///
														
 
															+  /// If isNonUniform is true, the sampled image will be decorated with
														
 
															+  /// NonUniformEXT.
														
 
															   uint32_t createImageSample(uint32_t texelType, uint32_t imageType,
														
 
															                              uint32_t image, uint32_t sampler,
														
 
															-                             uint32_t coordinate, uint32_t compareVal,
														
 
															-                             uint32_t bias, uint32_t lod,
														
 
															+                             bool isNonUniform, uint32_t coordinate,
														
 
															+                             uint32_t compareVal, uint32_t bias, uint32_t lod,
														
 
															                              std::pair<uint32_t, uint32_t> grad,
														
 
															                              uint32_t constOffset, uint32_t varOffset,
														
 
															                              uint32_t constOffsets, uint32_t sample,
														
@@ -235,12 +238,15 @@ public:
 
															   /// If residencyCodeId is not zero, the sparse version of the instructions
														
 
															   /// will be used, and the SPIR-V instruction for storing the resulting
														
 
															   /// residency code will also be emitted.
														
 
															+  /// If isNonUniform is true, the sampled image will be decorated with
														
 
															+  /// NonUniformEXT.
														
 
															   uint32_t createImageGather(uint32_t texelType, uint32_t imageType,
														
 
															                              uint32_t image, uint32_t sampler,
														
 
															-                             uint32_t coordinate, uint32_t component,
														
 
															-                             uint32_t compareVal, uint32_t constOffset,
														
 
															-                             uint32_t varOffset, uint32_t constOffsets,
														
 
															-                             uint32_t sample, uint32_t residencyCodeId);
														
 
															+                             bool isNonUniform, uint32_t coordinate,
														
 
															+                             uint32_t component, uint32_t compareVal,
														
 
															+                             uint32_t constOffset, uint32_t varOffset,
														
 
															+                             uint32_t constOffsets, uint32_t sample,
														
 
															+                             uint32_t residencyCodeId);
														
 
															   /// \brief Creates an OpImageSparseTexelsResident SPIR-V instruction for the
														
 
															   /// given Resident Code and returns the <result-id> of the instruction.
														
@@ -375,6 +381,9 @@ public:
 
															   /// \brief Decorates the given target <result-id> with the given location.
														
 
															   void decorateLocation(uint32_t targetId, uint32_t location);
														
 
															+  /// \brief Decorates the given target <result-id> with the given index.
														
 
															+  void decorateIndex(uint32_t targetId, uint32_t index);
														
 
															+
														
 
															   /// \brief Decorates the given target <result-id> with the given descriptor
														
 
															   /// set and binding number.
														
 
															   void decorateDSetBinding(uint32_t targetId, uint32_t setNumber,
														
--- a/tools/clang/include/clang/SPIRV/Type.h
+++ b/tools/clang/include/clang/SPIRV/Type.h
@@ -41,7 +41,9 @@ public:
 
															   spv::Op getOpcode() const { return opcode; }
														
 
															   const std::vector<uint32_t> &getArgs() const { return args; }
														
 
															-  const auto &getDecorations() const { return decorations; }
														
 
															+  const llvm::SetVector<const Decoration *> &getDecorations() const {
														
 
															+    return decorations;
														
 
															+  }
														
 
															   bool hasDecoration(const Decoration *) const;
														
 
															   bool isBooleanType() const;
														
--- a/tools/clang/lib/CodeGen/CGExpr.cpp
+++ b/tools/clang/lib/CodeGen/CGExpr.cpp
@@ -2901,7 +2901,16 @@ CodeGenFunction::EmitHLSLVectorElementExpr(const HLSLVectorElementExpr *E) {
 
															     // Otherwise, if the base is an lvalue ( as in the case of foo.x.x),
														
 
															     // emit the base as an lvalue.
														
 
															     const Expr *base = E->getBase();
														
 
															-
														
 
															+    if (const ImplicitCastExpr *ICE = dyn_cast<ImplicitCastExpr>(base)) {
														
 
															+      if (ICE->getCastKind() == CastKind::CK_HLSLVectorSplat &&
														
 
															+          E->getNumElements() == 1) {
														
 
															+        // For pattern like:
														
 
															+        //   static bool t;
														
 
															+        //   t.x = bool(a);
														
 
															+        // Just ignore the .x, treat it like t = bool(a);
														
 
															+        return EmitLValue(ICE->getSubExpr());
														
 
															+      }
														
 
															+    }
														
 
															     assert(hlsl::IsHLSLVecType(base->getType()));
														
 
															     Base = EmitLValue(base);
														
 
															   } else {
														
--- a/tools/clang/lib/CodeGen/CGHLSLMS.cpp
+++ b/tools/clang/lib/CodeGen/CGHLSLMS.cpp
@@ -53,6 +53,28 @@ using std::unique_ptr;
 
															 static const bool KeepUndefinedTrue = true; // Keep interpolation mode undefined if not set explicitly.
														
 
															+// Define constant variables exposed in DxilConstants.h
														
 
															+namespace hlsl {
														
 
															+namespace DXIL {
														
 
															+  // TODO: revisit data layout descriptions for the following:
														
 
															+  //      - x64 pointers?
														
 
															+  //      - Keep elf manging(m:e)?
														
 
															+
														
 
															+  // For legacy data layout, everything less than 32 align to 32.
														
 
															+  const char* kLegacyLayoutString = "e-m:e-p:32:32-i1:32-i8:32-i16:32-i32:32-i64:64-f16:32-f32:32-f:64:64-n8:16:32:64";
														
 
															+
														
 
															+  // New data layout with native low precision types
														
 
															+  const char* kNewLayoutString = "e-m:e-p:32:32-i1:32-i8:8-i16:16-i32:32-i64:64-f16:16-f32:32-f64:64-n8:16:32:64";
														
 
															+
														
 
															+  // Function Attributes
														
 
															+  // TODO: consider generating attributes from hctdb
														
 
															+  const char* kFP32DenormKindString          = "fp32-denorm-mode";
														
 
															+  const char* kFP32DenormValueAnyString      = "any";
														
 
															+  const char* kFP32DenormValuePreserveString = "preserve";
														
 
															+  const char* kFP32DenormValueFtzString      = "ftz";
														
 
															+} // DXIL
														
 
															+} // hlsl
														
 
															+
														
 
															 namespace {
														
 
															 /// Use this class to represent HLSL cbuffer in high-level DXIL.
														
--- a/tools/clang/lib/CodeGen/ModuleBuilder.cpp
+++ b/tools/clang/lib/CodeGen/ModuleBuilder.cpp
@@ -25,6 +25,7 @@
 
															 #include "llvm/IR/LLVMContext.h"
														
 
															 #include "llvm/IR/Module.h"
														
 
															 #include <memory>
														
 
															+#include "dxc/HLSL/DxilMetadataHelper.h" // HLSL Change - dx source info
														
 
															 using namespace clang;
														
 
															 namespace {
														
@@ -222,7 +223,8 @@ namespace {
 
															              it != end; ++it) {
														
 
															           if (it->first->isValid() && !it->second->IsSystemFile) {
														
 
															             if (pContents == nullptr) {
														
 
															-              pContents = M->getOrInsertNamedMetadata("llvm.dbg.contents");
														
 
															+              pContents = M->getOrInsertNamedMetadata(
														
 
															+                  hlsl::DxilMDHelper::kDxilSourceContentsMDName);
														
 
															             }
														
 
															             llvm::MDTuple *pFileInfo = llvm::MDNode::get(
														
 
															                 LLVMCtx,
														
@@ -234,7 +236,8 @@ namespace {
 
															         }
														
 
															         // Add Defines to Debug Info
														
 
															-        llvm::NamedMDNode *pDefines = M->getOrInsertNamedMetadata("llvm.dbg.defines");
														
 
															+        llvm::NamedMDNode *pDefines = M->getOrInsertNamedMetadata(
														
 
															+            hlsl::DxilMDHelper::kDxilSourceDefinesMDName);
														
 
															         std::vector<llvm::Metadata *> vecDefines;
														
 
															         vecDefines.resize(CodeGenOpts.HLSLDefines.size());
														
 
															         std::transform(CodeGenOpts.HLSLDefines.begin(), CodeGenOpts.HLSLDefines.end(),
														
@@ -243,13 +246,15 @@ namespace {
 
															         pDefines->addOperand(pDefinesInfo);
														
 
															         // Add main file name to debug info
														
 
															-        llvm::NamedMDNode *pSourceFilename = M->getOrInsertNamedMetadata("llvm.dbg.mainFileName");
														
 
															+        llvm::NamedMDNode *pSourceFilename = M->getOrInsertNamedMetadata(
														
 
															+            hlsl::DxilMDHelper::kDxilSourceMainFileNameMDName);
														
 
															         llvm::MDTuple *pFileName = llvm::MDNode::get(
														
 
															           LLVMCtx, llvm::MDString::get(LLVMCtx, CodeGenOpts.MainFileName));
														
 
															         pSourceFilename->addOperand(pFileName);
														
 
															         // Pass in any other arguments to debug info
														
 
															-        llvm::NamedMDNode *pArgs = M->getOrInsertNamedMetadata("llvm.dbg.args");
														
 
															+        llvm::NamedMDNode *pArgs = M->getOrInsertNamedMetadata(
														
 
															+            hlsl::DxilMDHelper::kDxilSourceArgsMDName);
														
 
															         std::vector<llvm::Metadata *> vecArguments;
														
 
															         vecArguments.resize(CodeGenOpts.HLSLArguments.size());
														
 
															         std::transform(CodeGenOpts.HLSLArguments.begin(), CodeGenOpts.HLSLArguments.end(),
														
--- a/tools/clang/lib/Frontend/CompilerInstance.cpp
+++ b/tools/clang/lib/Frontend/CompilerInstance.cpp
@@ -596,7 +596,7 @@ void CompilerInstance::clearOutputFiles(bool EraseFiles) {
 
															   }
														
 
															   OutputFiles.clear();
														
 
															   NonSeekStream.reset();
														
 
															-  if (errorsFound) throw std::exception("errors when processing output"); // HLSL Change
														
 
															+  if (errorsFound) throw std::runtime_error("errors when processing output"); // HLSL Change
														
 
															 }
														
 
															 raw_pwrite_stream *
														
--- a/tools/clang/lib/Frontend/CompilerInvocation.cpp
+++ b/tools/clang/lib/Frontend/CompilerInvocation.cpp
@@ -1277,7 +1277,7 @@ void CompilerInvocation::setLangDefaults(LangOptions &Opts, InputKind IK,
 
															     Opts.NativeHalfType = 1;
														
 
															   }
														
 
															-  Opts.HLSL = IK == IK_HLSL || LangStd == LangStandard::lang_hlsl // HLSL Change: Langstandard for HLSL
														
 
															+  Opts.HLSL = IK == IK_HLSL || LangStd == LangStandard::lang_hlsl; // HLSL Change: Langstandard for HLSL
														
 
															   Opts.CUDA = IK == IK_CUDA || IK == IK_PreprocessedCuda ||
														
 
															               LangStd == LangStandard::lang_cuda;
														
--- a/tools/clang/lib/Frontend/FrontendActions.cpp
+++ b/tools/clang/lib/Frontend/FrontendActions.cpp
@@ -706,7 +706,7 @@ HLSLRootSignatureAction::HLSLRootSignatureAction(StringRef rootSigMacro,
 
															                                                  unsigned major, unsigned minor)
														
 
															     : HLSLRootSignatureMacro(rootSigMacro), rootSigMajor(major),
														
 
															       rootSigMinor(minor) {
														
 
															-  rootSigHandle = std::make_unique<hlsl::RootSignatureHandle>();
														
 
															+  rootSigHandle = llvm::make_unique<hlsl::RootSignatureHandle>();
														
 
															 }
														
 
															 void HLSLRootSignatureAction::ExecuteAction() {
														
--- a/tools/clang/lib/Lex/HeaderSearch.cpp
+++ b/tools/clang/lib/Lex/HeaderSearch.cpp
@@ -564,7 +564,9 @@ static bool checkMSVCHeaderSearch(DiagnosticsEngine &Diags,
 
															                                   const FileEntry *MSFE, const FileEntry *FE,
														
 
															                                   SourceLocation IncludeLoc) {
														
 
															   if (MSFE && FE != MSFE) {
														
 
															+#if 0  // HLSL Change - turn off warnings of MSVC search rules
														
 
															     Diags.Report(IncludeLoc, diag::ext_pp_include_search_ms) << MSFE->getName();
														
 
															+#endif // HLSL Change
														
 
															     return true;
														
 
															   }
														
 
															   return false;
														
--- a/tools/clang/lib/Parse/HLSLRootSignature.cpp
+++ b/tools/clang/lib/Parse/HLSLRootSignature.cpp
@@ -83,6 +83,8 @@ void RootSignatureTokenizer::ReadNextToken(uint32_t BufferIdx)
 
															     char *pBuffer = m_TokenStrings[BufferIdx];
														
 
															     Token &T = m_Tokens[BufferIdx];
														
 
															     bool bFloat = false;
														
 
															+    bool bKW = false;
														
 
															+    char c = 0;
														
 
															     EatSpace();
														
@@ -185,7 +187,7 @@ void RootSignatureTokenizer::ReadNextToken(uint32_t BufferIdx)
 
															     //
														
 
															     // Classify token
														
 
															     //
														
 
															-    char c = pBuffer[0];
														
 
															+    c = pBuffer[0];
														
 
															     // Delimiters
														
 
															     switch(c)
														
@@ -245,7 +247,6 @@ void RootSignatureTokenizer::ReadNextToken(uint32_t BufferIdx)
 
															     // Keyword
														
 
															 #define KW(__name)  ToKeyword(pBuffer, T, #__name, Token::Type::__name)
														
 
															-    bool bKW = false;
														
 
															     // Case-incensitive
														
 
															     switch(toupper(c))
														
 
															     {
														
--- a/tools/clang/lib/Parse/Parser.cpp
+++ b/tools/clang/lib/Parse/Parser.cpp
@@ -1416,7 +1416,9 @@ Parser::TryAnnotateName(bool IsAddressOfOperand,
 
															     if (TryAnnotateTypeOrScopeTokenAfterScopeSpec(EnteringContext, false, SS,
														
 
															                                                   !WasScopeAnnotation))
														
 
															       return ANK_Error;
														
 
															-    return ANK_Unresolved;
														
 
															+    // HLSL Change Starts - allow implicitly annotated templates
														
 
															+    return (Tok.isNot(tok::annot_typename) || SS.isInvalid()) ? ANK_Unresolved : ANK_Success;
														
 
															+    // HLSL Change End
														
 
															   }
														
 
															   IdentifierInfo *Name = Tok.getIdentifierInfo();
														
--- a/tools/clang/lib/SPIRV/DeclResultIdMapper.cpp
+++ b/tools/clang/lib/SPIRV/DeclResultIdMapper.cpp
@@ -99,11 +99,11 @@ std::string StageVar::getSemanticStr() const {
 
															   // Use what is in the source code.
														
 
															   // TODO: this looks like a hack to make the current tests happy.
														
 
															   // Should consider remove it and fix all tests.
														
 
															-  if (semanticIndex == 0)
														
 
															-    return semanticStr;
														
 
															+  if (semanticInfo.index == 0)
														
 
															+    return semanticInfo.str;
														
 
															   std::ostringstream ss;
														
 
															-  ss << semanticName.str() << semanticIndex;
														
 
															+  ss << semanticInfo.name.str() << semanticInfo.index;
														
 
															   return ss.str();
														
 
															 }
														
@@ -181,8 +181,7 @@ bool CounterVarFields::assign(const CounterVarFields &srcFields,
 
															   return true;
														
 
															 }
														
 
															-DeclResultIdMapper::SemanticInfo
														
 
															-DeclResultIdMapper::getStageVarSemantic(const NamedDecl *decl) {
														
 
															+SemanticInfo DeclResultIdMapper::getStageVarSemantic(const NamedDecl *decl) {
														
 
															   for (auto *annotation : decl->getUnusualAnnotations()) {
														
 
															     if (auto *sema = dyn_cast<hlsl::SemanticDecl>(annotation)) {
														
 
															       llvm::StringRef semanticStr = sema->SemanticName;
														
@@ -282,8 +281,7 @@ DeclResultIdMapper::getDeclSpirvInfo(const ValueDecl *decl) const {
 
															   return nullptr;
														
 
															 }
														
 
															-SpirvEvalInfo DeclResultIdMapper::getDeclEvalInfo(const ValueDecl *decl,
														
 
															-                                                  bool checkRegistered) {
														
 
															+SpirvEvalInfo DeclResultIdMapper::getDeclEvalInfo(const ValueDecl *decl) {
														
 
															   if (const auto *info = getDeclSpirvInfo(decl))
														
 
															     if (info->indexInCTBuffer >= 0) {
														
 
															       // If this is a VarDecl inside a HLSLBufferDecl, we need to do an extra
														
@@ -306,15 +304,12 @@ SpirvEvalInfo DeclResultIdMapper::getDeclEvalInfo(const ValueDecl *decl,
 
															       return *info;
														
 
															     }
														
 
															-  if (checkRegistered) {
														
 
															-    emitFatalError("found unregistered decl", decl->getLocation())
														
 
															-        << decl->getName();
														
 
															-    emitNote("please file a bug report on "
														
 
															-             "https://github.com/Microsoft/DirectXShaderCompiler/issues with "
														
 
															-             "source code if possible",
														
 
															-             {});
														
 
															-  }
														
 
															-
														
 
															+  emitFatalError("found unregistered decl", decl->getLocation())
														
 
															+      << decl->getName();
														
 
															+  emitNote("please file a bug report on "
														
 
															+           "https://github.com/Microsoft/DirectXShaderCompiler/issues with "
														
 
															+           "source code if possible",
														
 
															+           {});
														
 
															   return 0;
														
 
															 }
														
@@ -413,6 +408,15 @@ SpirvEvalInfo DeclResultIdMapper::createExternVar(const VarDecl *var) {
 
															   uint32_t varType = typeTranslator.translateType(var->getType(), rule);
														
 
															+  // Require corresponding capability for accessing 16-bit data.
														
 
															+  if (storageClass == spv::StorageClass::Uniform &&
														
 
															+      spirvOptions.enable16BitTypes &&
														
 
															+      typeTranslator.isOrContains16BitType(var->getType())) {
														
 
															+    theBuilder.addExtension(Extension::KHR_16bit_storage,
														
 
															+                            "16-bit types in resource", var->getLocation());
														
 
															+    theBuilder.requireCapability(spv::Capability::StorageUniformBufferBlock16);
														
 
															+  }
														
 
															+
														
 
															   const uint32_t id = theBuilder.addModuleVar(varType, storageClass,
														
 
															                                               var->getName(), llvm::None);
														
 
															   const auto info =
														
@@ -466,9 +470,8 @@ uint32_t DeclResultIdMapper::getMatrixStructType(const VarDecl *matVar,
 
															 }
														
 
															 uint32_t DeclResultIdMapper::createStructOrStructArrayVarOfExplicitLayout(
														
 
															-    const DeclContext *decl, uint32_t arraySize,
														
 
															-    const ContextUsageKind usageKind, llvm::StringRef typeName,
														
 
															-    llvm::StringRef varName) {
														
 
															+    const DeclContext *decl, int arraySize, const ContextUsageKind usageKind,
														
 
															+    llvm::StringRef typeName, llvm::StringRef varName) {
														
 
															   // cbuffers are translated into OpTypeStruct with Block decoration.
														
 
															   // tbuffers are translated into OpTypeStruct with BufferBlock decoration.
														
 
															   // Push constants are translated into OpTypeStruct with Block decoration.
														
@@ -479,6 +482,7 @@ uint32_t DeclResultIdMapper::createStructOrStructArrayVarOfExplicitLayout(
 
															   const bool forCBuffer = usageKind == ContextUsageKind::CBuffer;
														
 
															   const bool forTBuffer = usageKind == ContextUsageKind::TBuffer;
														
 
															   const bool forGlobals = usageKind == ContextUsageKind::Globals;
														
 
															+  const bool forPC = usageKind == ContextUsageKind::PushConstant;
														
 
															   auto &context = *theBuilder.getSPIRVContext();
														
 
															   const LayoutRule layoutRule =
														
@@ -512,6 +516,19 @@ uint32_t DeclResultIdMapper::createStructOrStructArrayVarOfExplicitLayout(
 
															     fieldTypes.push_back(typeTranslator.translateType(varType, layoutRule));
														
 
															     fieldNames.push_back(declDecl->getName());
														
 
															+    // Require corresponding capability for accessing 16-bit data.
														
 
															+    if (spirvOptions.enable16BitTypes &&
														
 
															+        typeTranslator.isOrContains16BitType(varType)) {
														
 
															+      theBuilder.addExtension(Extension::KHR_16bit_storage,
														
 
															+                              "16-bit types in resource",
														
 
															+                              declDecl->getLocation());
														
 
															+      theBuilder.requireCapability(
														
 
															+          (forCBuffer || forGlobals)
														
 
															+              ? spv::Capability::StorageUniform16
														
 
															+              : forPC ? spv::Capability::StoragePushConstant16
														
 
															+                      : spv::Capability::StorageUniformBufferBlock16);
														
 
															+    }
														
 
															+
														
 
															     // tbuffer/TextureBuffers are non-writable SSBOs. OpMemberDecorate
														
 
															     // NonWritable must be applied to all fields.
														
 
															     if (forTBuffer) {
														
@@ -526,16 +543,22 @@ uint32_t DeclResultIdMapper::createStructOrStructArrayVarOfExplicitLayout(
 
															       theBuilder.getStructType(fieldTypes, typeName, fieldNames, decorations);
														
 
															   // Make an array if requested.
														
 
															-  if (arraySize)
														
 
															+  if (arraySize > 0) {
														
 
															     resultType = theBuilder.getArrayType(
														
 
															         resultType, theBuilder.getConstantUint32(arraySize));
														
 
															+  } else if (arraySize == -1) {
														
 
															+    // Runtime arrays of cbuffer/tbuffer needs additional capability.
														
 
															+    theBuilder.addExtension(Extension::EXT_descriptor_indexing,
														
 
															+                            "runtime array of resources", {});
														
 
															+    theBuilder.requireCapability(spv::Capability::RuntimeDescriptorArrayEXT);
														
 
															+    resultType = theBuilder.getRuntimeArrayType(resultType);
														
 
															+  }
														
 
															   // Register the <type-id> for this decl
														
 
															   ctBufferPCTypeIds[decl] = resultType;
														
 
															-  const auto sc = usageKind == ContextUsageKind::PushConstant
														
 
															-                      ? spv::StorageClass::PushConstant
														
 
															-                      : spv::StorageClass::Uniform;
														
 
															+  const auto sc =
														
 
															+      forPC ? spv::StorageClass::PushConstant : spv::StorageClass::Uniform;
														
 
															   // Create the variable for the whole struct / struct array.
														
 
															   return theBuilder.addModuleVar(resultType, sc, varName);
														
@@ -574,18 +597,28 @@ uint32_t DeclResultIdMapper::createCTBuffer(const HLSLBufferDecl *decl) {
 
															 }
														
 
															 uint32_t DeclResultIdMapper::createCTBuffer(const VarDecl *decl) {
														
 
															-  const auto *recordType = decl->getType()->getAs<RecordType>();
														
 
															-  uint32_t arraySize = 0;
														
 
															+  const RecordType *recordType = nullptr;
														
 
															+  int arraySize = 0;
														
 
															   // In case we have an array of ConstantBuffer/TextureBuffer:
														
 
															-  if (!recordType) {
														
 
															-    if (const auto *arrayType =
														
 
															+  if (const auto *arrayType = decl->getType()->getAsArrayTypeUnsafe()) {
														
 
															+    recordType = arrayType->getElementType()->getAs<RecordType>();
														
 
															+    if (const auto *caType =
														
 
															             astContext.getAsConstantArrayType(decl->getType())) {
														
 
															-      recordType = arrayType->getElementType()->getAs<RecordType>();
														
 
															-      arraySize = static_cast<uint32_t>(arrayType->getSize().getZExtValue());
														
 
															+      arraySize = static_cast<uint32_t>(caType->getSize().getZExtValue());
														
 
															+    } else {
														
 
															+      arraySize = -1;
														
 
															     }
														
 
															+  } else {
														
 
															+    recordType = decl->getType()->getAs<RecordType>();
														
 
															   }
														
 
															-  assert(recordType);
														
 
															+  if (!recordType) {
														
 
															+    emitError("constant/texture buffer type %0 unimplemented",
														
 
															+              decl->getLocStart())
														
 
															+        << decl->getType();
														
 
															+    return 0;
														
 
															+  }
														
 
															+
														
 
															   const auto *context = cast<HLSLBufferDecl>(decl->getDeclContext());
														
 
															   const auto usageKind = context->isCBuffer() ? ContextUsageKind::CBuffer
														
 
															                                               : ContextUsageKind::TBuffer;
														
@@ -646,11 +679,12 @@ void DeclResultIdMapper::createGlobalsCBuffer(const VarDecl *var) {
 
															   uint32_t index = 0;
														
 
															   for (const auto *decl : typeTranslator.collectDeclsInDeclContext(context))
														
 
															     if (const auto *varDecl = dyn_cast<VarDecl>(decl)) {
														
 
															-      if (const auto *init = varDecl->getInit()) {
														
 
															-        emitWarning(
														
 
															-            "variable '%0' will be placed in $Globals so initializer ignored",
														
 
															-            init->getExprLoc())
														
 
															-            << var->getName() << init->getSourceRange();
														
 
															+      if (!spirvOptions.noWarnIgnoredFeatures) {
														
 
															+        if (const auto *init = varDecl->getInit())
														
 
															+          emitWarning(
														
 
															+              "variable '%0' will be placed in $Globals so initializer ignored",
														
 
															+              init->getExprLoc())
														
 
															+              << var->getName() << init->getSourceRange();
														
 
															       }
														
 
															       if (const auto *attr = varDecl->getAttr<VKBindingAttr>()) {
														
 
															         emitError("variable '%0' will be placed in $Globals so cannot have "
														
@@ -817,37 +851,53 @@ namespace {
 
															 /// the same location.
														
 
															 class LocationSet {
														
 
															 public:
														
 
															+  /// Maximum number of indices supported
														
 
															+  const static uint32_t kMaxIndex = 2;
														
 
															   /// Maximum number of locations supported
														
 
															   // Typically we won't have that many stage input or output variables.
														
 
															   // Using 64 should be fine here.
														
 
															   const static uint32_t kMaxLoc = 64;
														
 
															-  LocationSet() : usedLocs(kMaxLoc, false), nextLoc(0) {}
														
 
															+  LocationSet() {
														
 
															+    for (uint32_t i = 0; i < kMaxIndex; ++i) {
														
 
															+      usedLocs[i].resize(kMaxLoc);
														
 
															+      nextLoc[i] = 0;
														
 
															+    }
														
 
															+  }
														
 
															   /// Uses the given location.
														
 
															-  void useLoc(uint32_t loc) { usedLocs.set(loc); }
														
 
															+  void useLoc(uint32_t loc, uint32_t index = 0) {
														
 
															+    assert(index < kMaxIndex);
														
 
															+    usedLocs[index].set(loc);
														
 
															+  }
														
 
															   /// Uses the next |count| available location.
														
 
															-  int useNextLocs(uint32_t count) {
														
 
															-    while (usedLocs[nextLoc])
														
 
															-      nextLoc++;
														
 
															+  int useNextLocs(uint32_t count, uint32_t index = 0) {
														
 
															+    assert(index < kMaxIndex);
														
 
															+    auto &locs = usedLocs[index];
														
 
															+    auto &next = nextLoc[index];
														
 
															+    while (locs[next])
														
 
															+      next++;
														
 
															-    int toUse = nextLoc;
														
 
															+    int toUse = next;
														
 
															     for (uint32_t i = 0; i < count; ++i) {
														
 
															-      assert(!usedLocs[nextLoc]);
														
 
															-      usedLocs.set(nextLoc++);
														
 
															+      assert(!locs[next]);
														
 
															+      locs.set(next++);
														
 
															     }
														
 
															     return toUse;
														
 
															   }
														
 
															   /// Returns true if the given location number is already used.
														
 
															-  bool isLocUsed(uint32_t loc) { return usedLocs[loc]; }
														
 
															+  bool isLocUsed(uint32_t loc, uint32_t index = 0) {
														
 
															+    assert(index < kMaxIndex);
														
 
															+    return usedLocs[index][loc];
														
 
															+  }
														
 
															 private:
														
 
															-  llvm::SmallBitVector usedLocs; ///< All previously used locations
														
 
															-  uint32_t nextLoc;              ///< Next available location
														
 
															+  llvm::SmallBitVector usedLocs[kMaxIndex]; ///< All previously used locations
														
 
															+  uint32_t nextLoc[kMaxIndex];              ///< Next available location
														
 
															 };
														
 
															 /// A class for managing resource bindings to avoid duplicate uses of the same
														
@@ -930,17 +980,14 @@ bool DeclResultIdMapper::finalizeStageIOLocations(bool forInput) {
 
															     bool noError = true;
														
 
															     for (const auto &var : stageVars) {
														
 
															-      // Skip those stage variables we are not handling for this call
														
 
															-      if (forInput != isInputStorageClass(var))
														
 
															-        continue;
														
 
															-
														
 
															-      // Skip builtins
														
 
															-      if (var.isSpirvBuitin())
														
 
															+      // Skip builtins & those stage variables we are not handling for this call
														
 
															+      if (var.isSpirvBuitin() || forInput != isInputStorageClass(var))
														
 
															         continue;
														
 
															       const auto *attr = var.getLocationAttr();
														
 
															       const auto loc = attr->getNumber();
														
 
															       const auto attrLoc = attr->getLocation(); // Attr source code location
														
 
															+      const auto idx = var.getIndexAttr() ? var.getIndexAttr()->getNumber() : 0;
														
 
															       if (loc >= LocationSet::kMaxLoc) {
														
 
															         emitError("stage %select{output|input}0 location #%1 too large",
														
@@ -950,15 +997,17 @@ bool DeclResultIdMapper::finalizeStageIOLocations(bool forInput) {
 
															       }
														
 
															       // Make sure the same location is not assigned more than once
														
 
															-      if (locSet.isLocUsed(loc)) {
														
 
															+      if (locSet.isLocUsed(loc, idx)) {
														
 
															         emitError("stage %select{output|input}0 location #%1 already assigned",
														
 
															                   attrLoc)
														
 
															             << forInput << loc;
														
 
															         noError = false;
														
 
															       }
														
 
															-      locSet.useLoc(loc);
														
 
															+      locSet.useLoc(loc, idx);
														
 
															       theBuilder.decorateLocation(var.getSpirvId(), loc);
														
 
															+      if (var.getIndexAttr())
														
 
															+        theBuilder.decorateIndex(var.getSpirvId(), idx);
														
 
															     }
														
 
															     return noError;
														
@@ -968,30 +1017,28 @@ bool DeclResultIdMapper::finalizeStageIOLocations(bool forInput) {
 
															   LocationSet locSet;
														
 
															   for (const auto &var : stageVars) {
														
 
															-    if (forInput != isInputStorageClass(var))
														
 
															+    if (var.isSpirvBuitin() || forInput != isInputStorageClass(var))
														
 
															       continue;
														
 
															-    if (!var.isSpirvBuitin()) {
														
 
															-      if (var.getLocationAttr() != nullptr) {
														
 
															-        // We have checked that not all of the stage variables have explicit
														
 
															-        // location assignment.
														
 
															-        emitError("partial explicit stage %select{output|input}0 location "
														
 
															-                  "assignment via vk::location(X) unsupported",
														
 
															-                  {})
														
 
															-            << forInput;
														
 
															-        return false;
														
 
															-      }
														
 
															+    if (var.getLocationAttr()) {
														
 
															+      // We have checked that not all of the stage variables have explicit
														
 
															+      // location assignment.
														
 
															+      emitError("partial explicit stage %select{output|input}0 location "
														
 
															+                "assignment via vk::location(X) unsupported",
														
 
															+                {})
														
 
															+          << forInput;
														
 
															+      return false;
														
 
															+    }
														
 
															-      // Only SV_Target, SV_Depth, SV_DepthLessEqual, SV_DepthGreaterEqual,
														
 
															-      // SV_StencilRef, SV_Coverage are allowed in the pixel shader.
														
 
															-      // Arbitrary semantics are disallowed in pixel shader.
														
 
															-      if (var.getSemantic() &&
														
 
															-          var.getSemantic()->GetKind() == hlsl::Semantic::Kind::Target) {
														
 
															-        theBuilder.decorateLocation(var.getSpirvId(), var.getSemanticIndex());
														
 
															-        locSet.useLoc(var.getSemanticIndex());
														
 
															-      } else {
														
 
															-        vars.push_back(&var);
														
 
															-      }
														
 
															+    const auto &semaInfo = var.getSemanticInfo();
														
 
															+
														
 
															+    // We should special rules for SV_Target: the location number comes from the
														
 
															+    // semantic string index.
														
 
															+    if (semaInfo.isTarget()) {
														
 
															+      theBuilder.decorateLocation(var.getSpirvId(), semaInfo.index);
														
 
															+      locSet.useLoc(semaInfo.index);
														
 
															+    } else {
														
 
															+      vars.push_back(&var);
														
 
															     }
														
 
															   }
														
@@ -1209,7 +1256,10 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															     // Found semantic attached directly to this Decl. This means we need to
														
 
															     // map this decl to a single stage variable.
														
 
															-    const auto semanticKind = semanticToUse->semantic->GetKind();
														
 
															+    if (!validateVKAttributes(decl))
														
 
															+      return false;
														
 
															+
														
 
															+    const auto semanticKind = semanticToUse->getKind();
														
 
															     // Error out when the given semantic is invalid in this shader model
														
 
															     if (hlsl::SigPoint::GetInterpretation(semanticKind, sigPoint->GetKind(),
														
@@ -1227,18 +1277,9 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															     const auto *builtinAttr = decl->getAttr<VKBuiltInAttr>();
														
 
															-    // For VS/HS/DS, the PointSize builtin is handled in gl_PerVertex.
														
 
															-    // For GSVIn also in gl_PerVertex; for GSOut, it's a stand-alone
														
 
															-    // variable handled below.
														
 
															-    if (builtinAttr && builtinAttr->getBuiltIn() == "PointSize" &&
														
 
															-        glPerVertex.tryToAccessPointSize(sigPoint->GetKind(), invocationId,
														
 
															-                                         value, noWriteBack))
														
 
															-      return true;
														
 
															-
														
 
															     // Special handling of certain mappings between HLSL semantics and
														
 
															     // SPIR-V builtins:
														
 
															-    // * SV_Position/SV_CullDistance/SV_ClipDistance should be grouped into the
														
 
															-    //   gl_PerVertex struct in vertex processing stages.
														
 
															+    // * SV_CullDistance/SV_ClipDistance are outsourced to GlPerVertex.
														
 
															     // * SV_DomainLocation can refer to a float2, whereas TessCoord is a float3.
														
 
															     //   To ensure SPIR-V validity, we must create a float3 and  extract a
														
 
															     //   float2 from it before passing it to the main function.
														
@@ -1302,8 +1343,7 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															                                        theBuilder.getConstantUint32(arraySize));
														
 
															     StageVar stageVar(
														
 
															-        sigPoint, semanticToUse->str, semanticToUse->semantic,
														
 
															-        semanticToUse->name, semanticToUse->index, builtinAttr, typeId,
														
 
															+        sigPoint, *semanticToUse, builtinAttr, typeId,
														
 
															         // For HS/DS/GS, we have already stripped the outmost arrayness on type.
														
 
															         typeTranslator.getLocationCount(type));
														
 
															     const auto name = namePrefix.str() + "." + stageVar.getSemanticStr();
														
@@ -1315,11 +1355,12 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															     stageVar.setSpirvId(varId);
														
 
															     stageVar.setLocationAttr(decl->getAttr<VKLocationAttr>());
														
 
															+    stageVar.setIndexAttr(decl->getAttr<VKIndexAttr>());
														
 
															     stageVars.push_back(stageVar);
														
 
															     // Emit OpDecorate* instructions to link this stage variable with the HLSL
														
 
															     // semantic it is created for
														
 
															-    theBuilder.decorateHlslSemantic(varId, stageVar.getSemanticStr());
														
 
															+    theBuilder.decorateHlslSemantic(varId, stageVar.getSemanticInfo().str);
														
 
															     // We have semantics attached to this decl, which means it must be a
														
 
															     // function/parameter/variable. All are DeclaratorDecls.
														
@@ -1410,9 +1451,10 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															       // represents a Boolean value where false must be exactly 0, but true can
														
 
															       // be any odd (i.e. bit 0 set) non-zero value)."
														
 
															       else if (semanticKind == hlsl::Semantic::Kind::InnerCoverage) {
														
 
															+        const auto constOne = theBuilder.getConstantUint32(1);
														
 
															+        const auto constZero = theBuilder.getConstantUint32(0);
														
 
															         *value = theBuilder.createSelect(theBuilder.getUint32Type(), *value,
														
 
															-                                         theBuilder.getConstantUint32(1),
														
 
															-                                         theBuilder.getConstantUint32(0));
														
 
															+                                         constOne, constZero);
														
 
															       }
														
 
															       // Special handling of SV_Barycentrics, which is a float3, but the
														
 
															       // underlying stage input variable is a float2 (only provides the first
														
@@ -1452,6 +1494,10 @@ bool DeclResultIdMapper::createStageVars(const hlsl::SigPoint *sigPoint,
 
															       if (noWriteBack)
														
 
															         return true;
														
 
															+      // Negate SV_Position.y if requested
														
 
															+      if (semanticToUse->semantic->GetKind() == hlsl::Semantic::Kind::Position)
														
 
															+        *value = invertYIfRequested(*value);
														
 
															+
														
 
															       uint32_t ptr = varId;
														
 
															       // Special handling of SV_TessFactor HS patch constant output.
														
@@ -1680,16 +1726,8 @@ bool DeclResultIdMapper::writeBackOutputStream(const NamedDecl *decl,
 
															     assert(found != stageVarIds.end());
														
 
															     // Negate SV_Position.y if requested
														
 
															-    if (spirvOptions.invertY &&
														
 
															-        semanticInfo.semantic->GetKind() == hlsl::Semantic::Kind::Position) {
														
 
															-
														
 
															-      const auto f32Type = theBuilder.getFloat32Type();
														
 
															-      const auto v4f32Type = theBuilder.getVecType(f32Type, 4);
														
 
															-      const auto oldY = theBuilder.createCompositeExtract(f32Type, value, {1});
														
 
															-      const auto newY =
														
 
															-          theBuilder.createUnaryOp(spv::Op::OpFNegate, f32Type, oldY);
														
 
															-      value = theBuilder.createCompositeInsert(v4f32Type, value, {1}, newY);
														
 
															-    }
														
 
															+    if (semanticInfo.semantic->GetKind() == hlsl::Semantic::Kind::Position)
														
 
															+      value = invertYIfRequested(value);
														
 
															     theBuilder.createStore(found->second, value);
														
 
															     return true;
														
@@ -1733,6 +1771,19 @@ bool DeclResultIdMapper::writeBackOutputStream(const NamedDecl *decl,
 
															   return true;
														
 
															 }
														
 
															+uint32_t DeclResultIdMapper::invertYIfRequested(uint32_t position) {
														
 
															+  // Negate SV_Position.y if requested
														
 
															+  if (spirvOptions.invertY) {
														
 
															+    const auto f32Type = theBuilder.getFloat32Type();
														
 
															+    const auto v4f32Type = theBuilder.getVecType(f32Type, 4);
														
 
															+    const auto oldY = theBuilder.createCompositeExtract(f32Type, position, {1});
														
 
															+    const auto newY =
														
 
															+        theBuilder.createUnaryOp(spv::Op::OpFNegate, f32Type, oldY);
														
 
															+    position = theBuilder.createCompositeInsert(v4f32Type, position, {1}, newY);
														
 
															+  }
														
 
															+  return position;
														
 
															+}
														
 
															+
														
 
															 void DeclResultIdMapper::decoratePSInterpolationMode(const NamedDecl *decl,
														
 
															                                                      QualType type,
														
 
															                                                      uint32_t varId) {
														
@@ -1796,9 +1847,8 @@ uint32_t DeclResultIdMapper::getBuiltinVar(spv::BuiltIn builtIn) {
 
															           hlsl::DxilParamInputQual::In, shaderModel.GetKind(),
														
 
															           /*isPatchConstant=*/false));
														
 
															-  StageVar stageVar(sigPoint, /*semaStr=*/"", hlsl::Semantic::GetInvalid(),
														
 
															-                    /*semaName=*/"", /*semaIndex=*/0, /*builtinAttr=*/nullptr,
														
 
															-                    type, /*locCount=*/0);
														
 
															+  StageVar stageVar(sigPoint, /*semaInfo=*/{}, /*builtinAttr=*/nullptr, type,
														
 
															+                    /*locCount=*/0);
														
 
															   stageVar.setIsSpirvBuiltin();
														
 
															   stageVar.setSpirvId(varId);
														
@@ -1823,7 +1873,7 @@ uint32_t DeclResultIdMapper::createSpirvStageVar(StageVar *stageVar,
 
															   using spv::BuiltIn;
														
 
															   const auto sigPoint = stageVar->getSigPoint();
														
 
															-  const auto semanticKind = stageVar->getSemantic()->GetKind();
														
 
															+  const auto semanticKind = stageVar->getSemanticInfo().getKind();
														
 
															   const auto sigPointKind = sigPoint->GetKind();
														
 
															   const uint32_t type = stageVar->getSpirvTypeId();
														
@@ -1885,7 +1935,6 @@ uint32_t DeclResultIdMapper::createSpirvStageVar(StageVar *stageVar,
 
															     case hlsl::SigPoint::Kind::DSCPIn:
														
 
															     case hlsl::SigPoint::Kind::DSOut:
														
 
															     case hlsl::SigPoint::Kind::GSVIn:
														
 
															-      llvm_unreachable("should be handled in gl_PerVertex struct");
														
 
															     case hlsl::SigPoint::Kind::GSOut:
														
 
															       stageVar->setIsSpirvBuiltin();
														
 
															       return theBuilder.addStageBuiltinVar(type, sc, BuiltIn::Position);
														
@@ -2121,15 +2170,22 @@ uint32_t DeclResultIdMapper::createSpirvStageVar(StageVar *stageVar,
 
															   case hlsl::Semantic::Kind::RenderTargetArrayIndex: {
														
 
															     switch (sigPointKind) {
														
 
															     case hlsl::SigPoint::Kind::VSIn:
														
 
															-    case hlsl::SigPoint::Kind::VSOut:
														
 
															     case hlsl::SigPoint::Kind::HSCPIn:
														
 
															     case hlsl::SigPoint::Kind::HSCPOut:
														
 
															     case hlsl::SigPoint::Kind::PCOut:
														
 
															     case hlsl::SigPoint::Kind::DSIn:
														
 
															     case hlsl::SigPoint::Kind::DSCPIn:
														
 
															-    case hlsl::SigPoint::Kind::DSOut:
														
 
															     case hlsl::SigPoint::Kind::GSVIn:
														
 
															       return theBuilder.addStageIOVar(type, sc, name.str());
														
 
															+    case hlsl::SigPoint::Kind::VSOut:
														
 
															+    case hlsl::SigPoint::Kind::DSOut:
														
 
															+      theBuilder.addExtension(Extension::EXT_shader_viewport_index_layer,
														
 
															+                              "SV_RenderTargetArrayIndex", srcLoc);
														
 
															+      theBuilder.requireCapability(
														
 
															+          spv::Capability::ShaderViewportIndexLayerEXT);
														
 
															+
														
 
															+      stageVar->setIsSpirvBuiltin();
														
 
															+      return theBuilder.addStageBuiltinVar(type, sc, BuiltIn::Layer);
														
 
															     case hlsl::SigPoint::Kind::GSOut:
														
 
															     case hlsl::SigPoint::Kind::PSIn:
														
 
															       theBuilder.requireCapability(spv::Capability::Geometry);
														
@@ -2147,15 +2203,22 @@ uint32_t DeclResultIdMapper::createSpirvStageVar(StageVar *stageVar,
 
															   case hlsl::Semantic::Kind::ViewPortArrayIndex: {
														
 
															     switch (sigPointKind) {
														
 
															     case hlsl::SigPoint::Kind::VSIn:
														
 
															-    case hlsl::SigPoint::Kind::VSOut:
														
 
															     case hlsl::SigPoint::Kind::HSCPIn:
														
 
															     case hlsl::SigPoint::Kind::HSCPOut:
														
 
															     case hlsl::SigPoint::Kind::PCOut:
														
 
															     case hlsl::SigPoint::Kind::DSIn:
														
 
															     case hlsl::SigPoint::Kind::DSCPIn:
														
 
															-    case hlsl::SigPoint::Kind::DSOut:
														
 
															     case hlsl::SigPoint::Kind::GSVIn:
														
 
															       return theBuilder.addStageIOVar(type, sc, name.str());
														
 
															+    case hlsl::SigPoint::Kind::VSOut:
														
 
															+    case hlsl::SigPoint::Kind::DSOut:
														
 
															+      theBuilder.addExtension(Extension::EXT_shader_viewport_index_layer,
														
 
															+                              "SV_ViewPortArrayIndex", srcLoc);
														
 
															+      theBuilder.requireCapability(
														
 
															+          spv::Capability::ShaderViewportIndexLayerEXT);
														
 
															+
														
 
															+      stageVar->setIsSpirvBuiltin();
														
 
															+      return theBuilder.addStageBuiltinVar(type, sc, BuiltIn::ViewportIndex);
														
 
															     case hlsl::SigPoint::Kind::GSOut:
														
 
															     case hlsl::SigPoint::Kind::PSIn:
														
 
															       theBuilder.requireCapability(spv::Capability::MultiViewport);
														
@@ -2198,13 +2261,49 @@ uint32_t DeclResultIdMapper::createSpirvStageVar(StageVar *stageVar,
 
															   }
														
 
															   default:
														
 
															     emitError("semantic %0 unimplemented", srcLoc)
														
 
															-        << stageVar->getSemantic()->GetName();
														
 
															+        << stageVar->getSemanticStr();
														
 
															     break;
														
 
															   }
														
 
															   return 0;
														
 
															 }
														
 
															+bool DeclResultIdMapper::validateVKAttributes(const NamedDecl *decl) {
														
 
															+  bool success = true;
														
 
															+  if (const auto *idxAttr = decl->getAttr<VKIndexAttr>()) {
														
 
															+    if (!shaderModel.IsPS()) {
														
 
															+      emitError("vk::index only allowed in pixel shader",
														
 
															+                idxAttr->getLocation());
														
 
															+      success = false;
														
 
															+    }
														
 
															+
														
 
															+    const auto *locAttr = decl->getAttr<VKLocationAttr>();
														
 
															+
														
 
															+    if (!locAttr) {
														
 
															+      emitError("vk::index should be used together with vk::location for "
														
 
															+                "dual-source blending",
														
 
															+                idxAttr->getLocation());
														
 
															+      success = false;
														
 
															+    } else {
														
 
															+      const auto locNumber = locAttr->getNumber();
														
 
															+      if (locNumber != 0) {
														
 
															+        emitError("dual-source blending should use vk::location 0",
														
 
															+                  locAttr->getLocation());
														
 
															+        success = false;
														
 
															+      }
														
 
															+    }
														
 
															+
														
 
															+    const auto idxNumber = idxAttr->getNumber();
														
 
															+    if (idxNumber != 0 && idxNumber != 1) {
														
 
															+      emitError("dual-source blending only accepts 0 or 1 as vk::index",
														
 
															+                idxAttr->getLocation());
														
 
															+      success = false;
														
 
															+    }
														
 
															+  }
														
 
															+
														
 
															+  return success;
														
 
															+}
														
 
															+
														
 
															 bool DeclResultIdMapper::validateVKBuiltins(const NamedDecl *decl,
														
 
															                                             const hlsl::SigPoint *sigPoint) {
														
 
															   bool success = true;
														
--- a/tools/clang/lib/SPIRV/DeclResultIdMapper.h
+++ b/tools/clang/lib/SPIRV/DeclResultIdMapper.h
@@ -32,16 +32,29 @@
 
															 namespace clang {
														
 
															 namespace spirv {
														
 
															+/// A struct containing information about a particular HLSL semantic.
														
 
															+struct SemanticInfo {
														
 
															+  llvm::StringRef str;            ///< The original semantic string
														
 
															+  const hlsl::Semantic *semantic; ///< The unique semantic object
														
 
															+  llvm::StringRef name;           ///< The semantic string without index
														
 
															+  uint32_t index;                 ///< The semantic index
														
 
															+  SourceLocation loc;             ///< Source code location
														
 
															+
														
 
															+  bool isValid() const { return semantic != nullptr; }
														
 
															+
														
 
															+  inline hlsl::Semantic::Kind getKind() const;
														
 
															+  /// \brief Returns true if this semantic is a SV_Target.
														
 
															+  inline bool isTarget() const;
														
 
															+};
														
 
															+
														
 
															 /// \brief The class containing HLSL and SPIR-V information about a Vulkan stage
														
 
															 /// (builtin/input/output) variable.
														
 
															 class StageVar {
														
 
															 public:
														
 
															-  inline StageVar(const hlsl::SigPoint *sig, llvm::StringRef semaStr,
														
 
															-                  const hlsl::Semantic *sema, llvm::StringRef semaName,
														
 
															-                  uint32_t semaIndex, const VKBuiltInAttr *builtin,
														
 
															-                  uint32_t type, uint32_t locCount)
														
 
															-      : sigPoint(sig), semanticStr(semaStr), semantic(sema),
														
 
															-        semanticName(semaName), semanticIndex(semaIndex), builtinAttr(builtin),
														
 
															+  inline StageVar(const hlsl::SigPoint *sig, SemanticInfo semaInfo,
														
 
															+                  const VKBuiltInAttr *builtin, uint32_t type,
														
 
															+                  uint32_t locCount)
														
 
															+      : sigPoint(sig), semanticInfo(std::move(semaInfo)), builtinAttr(builtin),
														
 
															         typeId(type), valueId(0), isBuiltin(false),
														
 
															         storageClass(spv::StorageClass::Max), location(nullptr),
														
 
															         locationCount(locCount) {
														
@@ -49,7 +62,8 @@ public:
 
															   }
														
 
															   const hlsl::SigPoint *getSigPoint() const { return sigPoint; }
														
 
															-  const hlsl::Semantic *getSemantic() const { return semantic; }
														
 
															+  const SemanticInfo &getSemanticInfo() const { return semanticInfo; }
														
 
															+  std::string getSemanticStr() const;
														
 
															   uint32_t getSpirvTypeId() const { return typeId; }
														
@@ -58,9 +72,6 @@ public:
 
															   const VKBuiltInAttr *getBuiltInAttr() const { return builtinAttr; }
														
 
															-  std::string getSemanticStr() const;
														
 
															-  uint32_t getSemanticIndex() const { return semanticIndex; }
														
 
															-
														
 
															   bool isSpirvBuitin() const { return isBuiltin; }
														
 
															   void setIsSpirvBuiltin() { isBuiltin = true; }
														
@@ -70,20 +81,17 @@ public:
 
															   const VKLocationAttr *getLocationAttr() const { return location; }
														
 
															   void setLocationAttr(const VKLocationAttr *loc) { location = loc; }
														
 
															+  const VKIndexAttr *getIndexAttr() const { return indexAttr; }
														
 
															+  void setIndexAttr(const VKIndexAttr *idx) { indexAttr = idx; }
														
 
															+
														
 
															   uint32_t getLocationCount() const { return locationCount; }
														
 
															 private:
														
 
															   /// HLSL SigPoint. It uniquely identifies each set of parameters that may be
														
 
															   /// input or output for each entry point.
														
 
															   const hlsl::SigPoint *sigPoint;
														
 
															-  /// Original HLSL semantic string in the source code.
														
 
															-  llvm::StringRef semanticStr;
														
 
															-  /// HLSL semantic.
														
 
															-  const hlsl::Semantic *semantic;
														
 
															-  /// Original HLSL semantic string (without index) in the source code.
														
 
															-  llvm::StringRef semanticName;
														
 
															-  /// HLSL semantic index.
														
 
															-  uint32_t semanticIndex;
														
 
															+  /// Information about HLSL semantic string.
														
 
															+  SemanticInfo semanticInfo;
														
 
															   /// SPIR-V BuiltIn attribute.
														
 
															   const VKBuiltInAttr *builtinAttr;
														
 
															   /// SPIR-V <type-id>.
														
@@ -96,6 +104,8 @@ private:
 
															   spv::StorageClass storageClass;
														
 
															   /// Location assignment if input/output variable.
														
 
															   const VKLocationAttr *location;
														
 
															+  /// Index assignment if PS output variable
														
 
															+  const VKIndexAttr *indexAttr;
														
 
															   /// How many locations this stage variable takes.
														
 
															   uint32_t locationCount;
														
 
															 };
														
@@ -112,7 +122,9 @@ public:
 
															   const hlsl::RegisterAssignment *getRegister() const { return reg; }
														
 
															   const VKBindingAttr *getBinding() const { return binding; }
														
 
															   bool isCounter() const { return isCounterVar; }
														
 
															-  const auto *getCounterBinding() const { return counterBinding; }
														
 
															+  const VKCounterBindingAttr *getCounterBinding() const {
														
 
															+    return counterBinding;
														
 
															+  }
														
 
															 private:
														
 
															   uint32_t varId;                             ///< <result-id>
														
@@ -363,13 +375,10 @@ private:
 
															   const DeclSpirvInfo *getDeclSpirvInfo(const ValueDecl *decl) const;
														
 
															 public:
														
 
															-  /// \brief Returns the information for the given decl. If the decl is not
														
 
															-  /// registered previously, return an invalid SpirvEvalInfo.
														
 
															+  /// \brief Returns the information for the given decl.
														
 
															   ///
														
 
															-  /// This method will emit a fatal error if checkRegistered is true and the
														
 
															-  /// decl is not registered.
														
 
															-  SpirvEvalInfo getDeclEvalInfo(const ValueDecl *decl,
														
 
															-                                bool checkRegistered = true);
														
 
															+  /// This method will panic if the given decl is not registered.
														
 
															+  SpirvEvalInfo getDeclEvalInfo(const ValueDecl *decl);
														
 
															   /// \brief Returns the <result-id> for the given function if already
														
 
															   /// registered; otherwise, treats the given function as a normal decl and
														
@@ -424,6 +433,9 @@ public:
 
															   bool writeBackOutputStream(const NamedDecl *decl, QualType type,
														
 
															                              uint32_t value);
														
 
															+  /// \brief Inverts SV_Position.y is requested.
														
 
															+  uint32_t invertYIfRequested(uint32_t position);
														
 
															+
														
 
															   /// \brief Decorates all stage input and output variables with proper
														
 
															   /// location and returns true on success.
														
 
															   ///
														
@@ -512,22 +524,15 @@ private:
 
															   /// TextureBuffers, and PushConstants. usageKind must be set properly
														
 
															   /// depending on the usage kind.
														
 
															   ///
														
 
															+  /// If arraySize is 0, the variable will be created as a struct ; if arraySize
														
 
															+  /// is > 0, the variable will be created as an array; if arraySize is -1, the
														
 
															+  /// variable will be created as a runtime array.
														
 
															+  ///
														
 
															   /// Panics if the DeclContext is neither HLSLBufferDecl or RecordDecl.
														
 
															   uint32_t createStructOrStructArrayVarOfExplicitLayout(
														
 
															-      const DeclContext *decl, uint32_t arraySize, ContextUsageKind usageKind,
														
 
															+      const DeclContext *decl, int arraySize, ContextUsageKind usageKind,
														
 
															       llvm::StringRef typeName, llvm::StringRef varName);
														
 
															-  /// A struct containing information about a particular HLSL semantic.
														
 
															-  struct SemanticInfo {
														
 
															-    llvm::StringRef str;            ///< The original semantic string
														
 
															-    const hlsl::Semantic *semantic; ///< The unique semantic object
														
 
															-    llvm::StringRef name;           ///< The semantic string without index
														
 
															-    uint32_t index;                 ///< The semantic index
														
 
															-    SourceLocation loc;             ///< Source code location
														
 
															-
														
 
															-    bool isValid() const { return semantic != nullptr; }
														
 
															-  };
														
 
															-
														
 
															   /// Returns the given decl's HLSL semantic information.
														
 
															   static SemanticInfo getStageVarSemantic(const NamedDecl *decl);
														
@@ -568,6 +573,9 @@ private:
 
															   uint32_t createSpirvStageVar(StageVar *, const NamedDecl *decl,
														
 
															                                const llvm::StringRef name, SourceLocation);
														
 
															+  /// Returns true if all vk:: attributes usages are valid.
														
 
															+  bool validateVKAttributes(const NamedDecl *decl);
														
 
															+
														
 
															   /// Returns true if all vk::builtin usages are valid.
														
 
															   bool validateVKBuiltins(const NamedDecl *decl,
														
 
															                           const hlsl::SigPoint *sigPoint);
														
@@ -714,6 +722,14 @@ public:
 
															   GlPerVertex glPerVertex;
														
 
															 };
														
 
															+hlsl::Semantic::Kind SemanticInfo::getKind() const {
														
 
															+  assert(semantic);
														
 
															+  return semantic->GetKind();
														
 
															+}
														
 
															+bool SemanticInfo::isTarget() const {
														
 
															+  return semantic && semantic->GetKind() == hlsl::Semantic::Kind::Target;
														
 
															+}
														
 
															+
														
 
															 void CounterIdAliasPair::assign(const CounterIdAliasPair &srcPair,
														
 
															                                 ModuleBuilder &builder,
														
 
															                                 TypeTranslator &translator) const {
														
@@ -731,7 +747,7 @@ DeclResultIdMapper::DeclResultIdMapper(const hlsl::ShaderModel &model,
 
															       astContext(context), diags(context.getDiagnostics()),
														
 
															       typeTranslator(translator), featureManager(features), entryFunctionId(0),
														
 
															       laneCountBuiltinId(0), laneIndexBuiltinId(0), needsLegalization(false),
														
 
															-      glPerVertex(model, context, builder, typeTranslator, options.invertY) {}
														
 
															+      glPerVertex(model, context, builder, typeTranslator) {}
														
 
															 bool DeclResultIdMapper::decorateStageIOLocations() {
														
 
															   // Try both input and output even if input location assignment failed
														
--- a/tools/clang/lib/SPIRV/Decoration.cpp
+++ b/tools/clang/lib/SPIRV/Decoration.cpp
@@ -280,6 +280,10 @@ Decoration::getSecondaryViewportRelativeNV(SPIRVContext &context,
 
															   Decoration d = Decoration(spv::Decoration::SecondaryViewportRelativeNV);
														
 
															   return getUniqueDecoration(context, d);
														
 
															 }
														
 
															+const Decoration *Decoration::getNonUniformEXT(SPIRVContext &context) {
														
 
															+  Decoration d = Decoration(spv::Decoration::NonUniformEXT);
														
 
															+  return getUniqueDecoration(context, d);
														
 
															+}
														
 
															 const Decoration *Decoration::getHlslCounterBufferGOOGLE(SPIRVContext &context,
														
 
															                                                          uint32_t id) {
														
--- a/tools/clang/lib/SPIRV/FeatureManager.cpp
+++ b/tools/clang/lib/SPIRV/FeatureManager.cpp
@@ -100,10 +100,13 @@ Extension FeatureManager::getExtensionSymbol(llvm::StringRef name) {
 
															       .Case("SPV_KHR_multiview", Extension::KHR_multiview)
														
 
															       .Case("SPV_KHR_shader_draw_parameters",
														
 
															             Extension::KHR_shader_draw_parameters)
														
 
															+      .Case("SPV_EXT_descriptor_indexing", Extension::EXT_descriptor_indexing)
														
 
															       .Case("SPV_EXT_fragment_fully_covered",
														
 
															             Extension::EXT_fragment_fully_covered)
														
 
															       .Case("SPV_EXT_shader_stencil_export",
														
 
															             Extension::EXT_shader_stencil_export)
														
 
															+      .Case("SPV_EXT_shader_viewport_index_layer",
														
 
															+            Extension::EXT_shader_viewport_index_layer)
														
 
															       .Case("SPV_AMD_gpu_shader_half_float",
														
 
															             Extension::AMD_gpu_shader_half_float)
														
 
															       .Case("SPV_AMD_shader_explicit_vertex_parameter",
														
@@ -125,10 +128,14 @@ const char *FeatureManager::getExtensionName(Extension symbol) {
 
															     return "SPV_KHR_multiview";
														
 
															   case Extension::KHR_shader_draw_parameters:
														
 
															     return "SPV_KHR_shader_draw_parameters";
														
 
															+  case Extension::EXT_descriptor_indexing:
														
 
															+    return "SPV_EXT_descriptor_indexing";
														
 
															   case Extension::EXT_fragment_fully_covered:
														
 
															     return "SPV_EXT_fragment_fully_covered";
														
 
															   case Extension::EXT_shader_stencil_export:
														
 
															     return "SPV_EXT_shader_stencil_export";
														
 
															+  case Extension::EXT_shader_viewport_index_layer:
														
 
															+    return "SPV_EXT_shader_viewport_index_layer";
														
 
															   case Extension::AMD_gpu_shader_half_float:
														
 
															     return "SPV_AMD_gpu_shader_half_float";
														
 
															   case Extension::AMD_shader_explicit_vertex_parameter:
														
--- a/tools/clang/lib/SPIRV/GlPerVertex.cpp
+++ b/tools/clang/lib/SPIRV/GlPerVertex.cpp
@@ -18,11 +18,8 @@ namespace clang {
 
															 namespace spirv {
														
 
															 namespace {
														
 
															-constexpr uint32_t gPositionIndex = 0;
														
 
															-constexpr uint32_t gPointSizeIndex = 1;
														
 
															-constexpr uint32_t gClipDistanceIndex = 2;
														
 
															-constexpr uint32_t gCullDistanceIndex = 3;
														
 
															-constexpr uint32_t gGlPerVertexSize = 4;
														
 
															+constexpr uint32_t gClipDistanceIndex = 0;
														
 
															+constexpr uint32_t gCullDistanceIndex = 1;
														
 
															 /// \brief Returns true if the given decl has a semantic string attached and
														
 
															 /// writes the info to *semanticStr, *semantic, and *semanticIndex.
														
@@ -63,80 +60,49 @@ inline bool hasGSPrimitiveTypeQualifier(const DeclaratorDecl *decl) {
 
															 } // anonymous namespace
														
 
															 GlPerVertex::GlPerVertex(const hlsl::ShaderModel &sm, ASTContext &context,
														
 
															-                         ModuleBuilder &builder, TypeTranslator &translator,
														
 
															-                         bool negateY)
														
 
															+                         ModuleBuilder &builder, TypeTranslator &translator)
														
 
															     : shaderModel(sm), astContext(context), theBuilder(builder),
														
 
															-      typeTranslator(translator), invertY(negateY), inIsGrouped(true),
														
 
															-      outIsGrouped(true), inBlockVar(0), outBlockVar(0), inClipVar(0),
														
 
															-      inCullVar(0), outClipVar(0), outCullVar(0), inArraySize(0),
														
 
															-      outArraySize(0), inClipArraySize(1), outClipArraySize(1),
														
 
															-      inCullArraySize(1), outCullArraySize(1), inSemanticStrs(4, ""),
														
 
															-      outSemanticStrs(4, "") {}
														
 
															+      typeTranslator(translator), inClipVar(0), inCullVar(0), outClipVar(0),
														
 
															+      outCullVar(0), inArraySize(0), outArraySize(0), inClipArraySize(1),
														
 
															+      outClipArraySize(1), inCullArraySize(1), outCullArraySize(1),
														
 
															+      inSemanticStrs(2, ""), outSemanticStrs(2, "") {}
														
 
															 void GlPerVertex::generateVars(uint32_t inArrayLen, uint32_t outArrayLen) {
														
 
															-  // Calling this method twice is an internal error.
														
 
															-  assert(inBlockVar == 0);
														
 
															-  assert(outBlockVar == 0);
														
 
															-
														
 
															   inArraySize = inArrayLen;
														
 
															   outArraySize = outArrayLen;
														
 
															-  switch (shaderModel.GetKind()) {
														
 
															-  case hlsl::ShaderModel::Kind::Vertex:
														
 
															-    outBlockVar = createBlockVar(/*asInput=*/false, 0);
														
 
															-    break;
														
 
															-  case hlsl::ShaderModel::Kind::Hull:
														
 
															-    inBlockVar = createBlockVar(/*asInput=*/true, inArraySize);
														
 
															-    outBlockVar = createBlockVar(/*asInput=*/false, outArraySize);
														
 
															-    break;
														
 
															-  case hlsl::ShaderModel::Kind::Domain:
														
 
															-    inBlockVar = createBlockVar(/*asInput=*/true, inArraySize);
														
 
															-    outBlockVar = createBlockVar(/*asInput=*/false, 0);
														
 
															-    break;
														
 
															-  case hlsl::ShaderModel::Kind::Geometry:
														
 
															-    inBlockVar = createBlockVar(/*asInput=*/true, inArraySize);
														
 
															-    if (!outClipType.empty())
														
 
															-      outClipVar = createClipDistanceVar(/*asInput=*/false, outClipArraySize);
														
 
															-    if (!outCullType.empty())
														
 
															-      outCullVar = createCullDistanceVar(/*asInput=*/false, outCullArraySize);
														
 
															-    outIsGrouped = false;
														
 
															-    break;
														
 
															-  case hlsl::ShaderModel::Kind::Pixel:
														
 
															-    if (!inClipType.empty())
														
 
															-      inClipVar = createClipDistanceVar(/*asInput=*/true, inClipArraySize);
														
 
															-    if (!inCullType.empty())
														
 
															-      inCullVar = createCullDistanceVar(/*asInput=*/true, inCullArraySize);
														
 
															-    inIsGrouped = false;
														
 
															-    break;
														
 
															-  }
														
 
															+  if (!inClipType.empty())
														
 
															+    inClipVar = createClipCullDistanceVar(/*asInput=*/true, /*isClip=*/true,
														
 
															+                                          inClipArraySize);
														
 
															+  if (!inCullType.empty())
														
 
															+    inCullVar = createClipCullDistanceVar(/*asInput=*/true, /*isClip=*/false,
														
 
															+                                          inCullArraySize);
														
 
															+  if (!outClipType.empty())
														
 
															+    outClipVar = createClipCullDistanceVar(/*asInput=*/false, /*isClip=*/true,
														
 
															+                                           outClipArraySize);
														
 
															+  if (!outCullType.empty())
														
 
															+    outCullVar = createClipCullDistanceVar(/*asInput=*/false, /*isClip=*/false,
														
 
															+                                           outCullArraySize);
														
 
															 }
														
 
															-llvm::SmallVector<uint32_t, 4> GlPerVertex::getStageInVars() const {
														
 
															-  llvm::SmallVector<uint32_t, 4> vars;
														
 
															-  if (inIsGrouped) {
														
 
															-    if (inBlockVar)
														
 
															-      vars.push_back(inBlockVar);
														
 
															-  } else {
														
 
															-    if (inClipVar)
														
 
															-      vars.push_back(inClipVar);
														
 
															-    if (inCullVar)
														
 
															-      vars.push_back(inCullVar);
														
 
															-  }
														
 
															+llvm::SmallVector<uint32_t, 2> GlPerVertex::getStageInVars() const {
														
 
															+  llvm::SmallVector<uint32_t, 2> vars;
														
 
															+
														
 
															+  if (inClipVar)
														
 
															+    vars.push_back(inClipVar);
														
 
															+  if (inCullVar)
														
 
															+    vars.push_back(inCullVar);
														
 
															   return vars;
														
 
															 }
														
 
															-llvm::SmallVector<uint32_t, 4> GlPerVertex::getStageOutVars() const {
														
 
															-  llvm::SmallVector<uint32_t, 4> vars;
														
 
															-  if (outIsGrouped) {
														
 
															-    if (outBlockVar)
														
 
															-      vars.push_back(outBlockVar);
														
 
															-  } else {
														
 
															-    if (outClipVar)
														
 
															-      vars.push_back(outClipVar);
														
 
															-    if (outCullVar)
														
 
															-      vars.push_back(outCullVar);
														
 
															-  }
														
 
															+llvm::SmallVector<uint32_t, 2> GlPerVertex::getStageOutVars() const {
														
 
															+  llvm::SmallVector<uint32_t, 2> vars;
														
 
															+
														
 
															+  if (outClipVar)
														
 
															+    vars.push_back(outClipVar);
														
 
															+  if (outCullVar)
														
 
															+    vars.push_back(outCullVar);
														
 
															   return vars;
														
 
															 }
														
@@ -214,12 +180,9 @@ bool GlPerVertex::doGlPerVertexFacts(const DeclaratorDecl *decl,
 
															   uint32_t *blockArraySize = asInput ? &inArraySize : &outArraySize;
														
 
															   bool isCull = false;
														
 
															   auto *semanticStrs = asInput ? &inSemanticStrs : &outSemanticStrs;
														
 
															-  auto index = gGlPerVertexSize; // The index of this semantic in gl_PerVertex
														
 
															+  uint32_t index = kSemanticStrCount;
														
 
															   switch (semantic->GetKind()) {
														
 
															-  case hlsl::Semantic::Kind::Position:
														
 
															-    index = gPositionIndex;
														
 
															-    break;
														
 
															   case hlsl::Semantic::Kind::ClipDistance:
														
 
															     typeMap = asInput ? &inClipType : &outClipType;
														
 
															     index = gClipDistanceIndex;
														
@@ -231,15 +194,9 @@ bool GlPerVertex::doGlPerVertexFacts(const DeclaratorDecl *decl,
 
															     break;
														
 
															   }
														
 
															-  // PointSize does not have corresponding SV semantic; it uses
														
 
															-  // [[vk::builtin("PointSize")]] instead.
														
 
															-  if (const auto *builtinAttr = decl->getAttr<VKBuiltInAttr>())
														
 
															-    if (builtinAttr->getBuiltIn() == "PointSize")
														
 
															-      index = gPointSizeIndex;
														
 
															-
														
 
															   // Remember the semantic strings provided by the developer so that we can
														
 
															   // emit OpDecorate* instructions properly for them
														
 
															-  if (index < gGlPerVertexSize) {
														
 
															+  if (index < kSemanticStrCount) {
														
 
															     if ((*semanticStrs)[index].empty())
														
 
															       (*semanticStrs)[index] = semanticStr;
														
 
															     // We can have multiple ClipDistance/CullDistance semantics mapping to the
														
@@ -353,70 +310,27 @@ void GlPerVertex::calculateClipCullDistanceArraySize() {
 
															   updateSizeAndOffset(outCullType, &outCullOffset, &outCullArraySize);
														
 
															 }
														
 
															-uint32_t GlPerVertex::createBlockVar(bool asInput, uint32_t arraySize) {
														
 
															-  const llvm::StringRef typeName = "type.gl_PerVertex";
														
 
															-  spv::StorageClass sc = spv::StorageClass::Input;
														
 
															-  llvm::StringRef varName = "gl_PerVertexIn";
														
 
															-  auto *semanticStrs = &inSemanticStrs;
														
 
															-  uint32_t clipSize = inClipArraySize;
														
 
															-  uint32_t cullSize = inCullArraySize;
														
 
															-
														
 
															-  if (!asInput) {
														
 
															-    sc = spv::StorageClass::Output;
														
 
															-    varName = "gl_PerVertexOut";
														
 
															-    semanticStrs = &outSemanticStrs;
														
 
															-    clipSize = outClipArraySize;
														
 
															-    cullSize = outCullArraySize;
														
 
															-  }
														
 
															-
														
 
															-  uint32_t typeId = typeTranslator.getGlPerVertexStruct(
														
 
															-      clipSize, cullSize, typeName, *semanticStrs);
														
 
															-
														
 
															-  // Handle the extra arrayness over the block
														
 
															-  if (arraySize != 0) {
														
 
															-    const uint32_t arraySizeId = theBuilder.getConstantUint32(arraySize);
														
 
															-    typeId = theBuilder.getArrayType(typeId, arraySizeId);
														
 
															-  }
														
 
															-
														
 
															-  return theBuilder.addStageIOVar(typeId, sc, varName);
														
 
															-}
														
 
															-
														
 
															-uint32_t GlPerVertex::createPositionVar(bool asInput) {
														
 
															-  const uint32_t type = theBuilder.getVecType(theBuilder.getFloat32Type(), 4);
														
 
															-  const spv::StorageClass sc =
														
 
															-      asInput ? spv::StorageClass::Input : spv::StorageClass::Output;
														
 
															-  // Special handling here. Requesting Position for input means we are in
														
 
															-  // PS, which should use FragCoord instead of Position.
														
 
															-  assert(asInput ? shaderModel.IsPS() : true);
														
 
															-  const spv::BuiltIn builtin =
														
 
															-      asInput ? spv::BuiltIn::FragCoord : spv::BuiltIn::Position;
														
 
															-
														
 
															-  return theBuilder.addStageBuiltinVar(type, sc, builtin);
														
 
															-}
														
 
															-
														
 
															-uint32_t GlPerVertex::createClipDistanceVar(bool asInput, uint32_t arraySize) {
														
 
															-  const uint32_t type = theBuilder.getArrayType(
														
 
															+uint32_t GlPerVertex::createClipCullDistanceVar(bool asInput, bool isClip,
														
 
															+                                                uint32_t arraySize) {
														
 
															+  uint32_t type = theBuilder.getArrayType(
														
 
															       theBuilder.getFloat32Type(), theBuilder.getConstantUint32(arraySize));
														
 
															-  spv::StorageClass sc =
														
 
															-      asInput ? spv::StorageClass::Input : spv::StorageClass::Output;
														
 
															-
														
 
															-  auto id = theBuilder.addStageBuiltinVar(type, sc, spv::BuiltIn::ClipDistance);
														
 
															-  theBuilder.decorateHlslSemantic(
														
 
															-      id, asInput ? inSemanticStrs[gClipDistanceIndex]
														
 
															-                  : outSemanticStrs[gClipDistanceIndex]);
														
 
															-  return id;
														
 
															-}
														
 
															+  if (asInput && inArraySize != 0) {
														
 
															+    type = theBuilder.getArrayType(type,
														
 
															+                                   theBuilder.getConstantUint32(inArraySize));
														
 
															+  } else if (!asInput && outArraySize != 0) {
														
 
															+    type = theBuilder.getArrayType(type,
														
 
															+                                   theBuilder.getConstantUint32(outArraySize));
														
 
															+  }
														
 
															-uint32_t GlPerVertex::createCullDistanceVar(bool asInput, uint32_t arraySize) {
														
 
															-  const uint32_t type = theBuilder.getArrayType(
														
 
															-      theBuilder.getFloat32Type(), theBuilder.getConstantUint32(arraySize));
														
 
															   spv::StorageClass sc =
														
 
															       asInput ? spv::StorageClass::Input : spv::StorageClass::Output;
														
 
															-  auto id = theBuilder.addStageBuiltinVar(type, sc, spv::BuiltIn::CullDistance);
														
 
															-  theBuilder.decorateHlslSemantic(
														
 
															-      id, asInput ? inSemanticStrs[gCullDistanceIndex]
														
 
															-                  : outSemanticStrs[gCullDistanceIndex]);
														
 
															+  auto id = theBuilder.addStageBuiltinVar(type, sc,
														
 
															+                                          isClip ? spv::BuiltIn::ClipDistance
														
 
															+                                                 : spv::BuiltIn::CullDistance);
														
 
															+  const auto index = isClip ? gClipDistanceIndex : gCullDistanceIndex;
														
 
															+  theBuilder.decorateHlslSemantic(id, asInput ? inSemanticStrs[index]
														
 
															+                                              : outSemanticStrs[index]);
														
 
															   return id;
														
 
															 }
														
@@ -430,7 +344,6 @@ bool GlPerVertex::tryToAccess(hlsl::SigPoint::Kind sigPointKind,
 
															                                  : true);
														
 
															   switch (semanticKind) {
														
 
															-  case hlsl::Semantic::Kind::Position:
														
 
															   case hlsl::Semantic::Kind::ClipDistance:
														
 
															   case hlsl::Semantic::Kind::CullDistance:
														
 
															     // gl_PerVertex only cares about these builtins.
														
@@ -441,24 +354,12 @@ bool GlPerVertex::tryToAccess(hlsl::SigPoint::Kind sigPointKind,
 
															   switch (sigPointKind) {
														
 
															   case hlsl::SigPoint::Kind::PSIn:
														
 
															-    // We don't handle stand-alone Position builtin in this class.
														
 
															-    if (semanticKind == hlsl::Semantic::Kind::Position)
														
 
															-      return false; // Fall back to the normal path
														
 
															-
														
 
															-    // Fall through
														
 
															-
														
 
															   case hlsl::SigPoint::Kind::HSCPIn:
														
 
															   case hlsl::SigPoint::Kind::DSCPIn:
														
 
															   case hlsl::SigPoint::Kind::GSVIn:
														
 
															     return readField(semanticKind, semanticIndex, value);
														
 
															   case hlsl::SigPoint::Kind::GSOut:
														
 
															-    // We don't handle stand-alone Position builtin in this class.
														
 
															-    if (semanticKind == hlsl::Semantic::Kind::Position)
														
 
															-      return false; // Fall back to the normal path
														
 
															-
														
 
															-    // Fall through
														
 
															-
														
 
															   case hlsl::SigPoint::Kind::VSOut:
														
 
															   case hlsl::SigPoint::Kind::HSCPOut:
														
 
															   case hlsl::SigPoint::Kind::DSOut:
														
@@ -471,68 +372,9 @@ bool GlPerVertex::tryToAccess(hlsl::SigPoint::Kind sigPointKind,
 
															   return false;
														
 
															 }
														
 
															-bool GlPerVertex::tryToAccessPointSize(hlsl::SigPoint::Kind sigPointKind,
														
 
															-                                       llvm::Optional<uint32_t> invocation,
														
 
															-                                       uint32_t *value, bool noWriteBack) {
														
 
															-  switch (sigPointKind) {
														
 
															-  case hlsl::SigPoint::Kind::HSCPIn:
														
 
															-  case hlsl::SigPoint::Kind::DSCPIn:
														
 
															-  case hlsl::SigPoint::Kind::GSVIn:
														
 
															-    *value = readPositionOrPointSize(/*isPosition=*/false);
														
 
															-    return true;
														
 
															-  case hlsl::SigPoint::Kind::VSOut:
														
 
															-  case hlsl::SigPoint::Kind::HSCPOut:
														
 
															-  case hlsl::SigPoint::Kind::DSOut:
														
 
															-    writePositionOrPointSize(/*isPosition=*/false, invocation, *value);
														
 
															-    return true;
														
 
															-  }
														
 
															-
														
 
															-  return false; // Fall back to normal path: GSOut
														
 
															-}
														
 
															-
														
 
															-uint32_t GlPerVertex::readPositionOrPointSize(bool isPosition) const {
														
 
															-  // We do not handle stand-alone Position/PointSize builtin here.
														
 
															-  assert(inIsGrouped);
														
 
															-
														
 
															-  // The PointSize builtin is always of float type.
														
 
															-  // The Position builtin is always of float4 type.
														
 
															-  const uint32_t f32Type = theBuilder.getFloat32Type();
														
 
															-  const uint32_t fieldType =
														
 
															-      isPosition ? theBuilder.getVecType(f32Type, 4) : f32Type;
														
 
															-  const uint32_t ptrType =
														
 
															-      theBuilder.getPointerType(fieldType, spv::StorageClass::Input);
														
 
															-  const uint32_t fieldIndex = theBuilder.getConstantUint32(isPosition ? 0 : 1);
														
 
															-
														
 
															-  if (inArraySize == 0) {
														
 
															-    // The input builtin block is a single block. Only need one index to
														
 
															-    // locate the Position/PointSize builtin.
														
 
															-    const uint32_t ptr =
														
 
															-        theBuilder.createAccessChain(ptrType, inBlockVar, {fieldIndex});
														
 
															-    return theBuilder.createLoad(fieldType, ptr);
														
 
															-  }
														
 
															-
														
 
															-  // The input builtin block is an array of blocks, which means we need to
														
 
															-  // read an array of float4 from an array of structs.
														
 
															-
														
 
															-  llvm::SmallVector<uint32_t, 8> elements;
														
 
															-  for (uint32_t i = 0; i < inArraySize; ++i) {
														
 
															-    const uint32_t arrayIndex = theBuilder.getConstantUint32(i);
														
 
															-    // Get pointer into the array of structs. We need two indices to locate
														
 
															-    // the Position/PointSize builtin now: the first one is the array index,
														
 
															-    // and the second one is the struct index.
														
 
															-    const uint32_t ptr = theBuilder.createAccessChain(ptrType, inBlockVar,
														
 
															-                                                      {arrayIndex, fieldIndex});
														
 
															-    elements.push_back(theBuilder.createLoad(fieldType, ptr));
														
 
															-  }
														
 
															-  // Construct a new array of float4/float for the Position/PointSize builtins
														
 
															-  const uint32_t arrayType = theBuilder.getArrayType(
														
 
															-      fieldType, theBuilder.getConstantUint32(inArraySize));
														
 
															-  return theBuilder.createCompositeConstruct(arrayType, elements);
														
 
															-}
														
 
															-
														
 
															 uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
														
 
															                                               QualType asType) const {
														
 
															-  const uint32_t clipCullIndex = isClip ? 2 : 3;
														
 
															+  const uint32_t clipCullVar = isClip ? inClipVar : inCullVar;
														
 
															   // The ClipDistance/CullDistance is always an float array. We are accessing
														
 
															   // it using pointers, which should be of pointer to float type.
														
@@ -541,25 +383,16 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															       theBuilder.getPointerType(f32Type, spv::StorageClass::Input);
														
 
															   if (inArraySize == 0) {
														
 
															-    // The input builtin block is a single block. Only need two indices to
														
 
															-    // locate the array segment for this SV_ClipDistance/SV_CullDistance
														
 
															-    // variable: one is the index in the gl_PerVertex struct, the other is
														
 
															-    // the start offset within the float array.
														
 
															+    // The input builtin does not have extra arrayness. Only need one index
														
 
															+    // to locate the array segment for this SV_ClipDistance/SV_CullDistance
														
 
															+    // variable: the start offset within the float array.
														
 
															     QualType elemType = {};
														
 
															     uint32_t count = {};
														
 
															     if (TypeTranslator::isScalarType(asType)) {
														
 
															       const uint32_t offsetId = theBuilder.getConstantUint32(offset);
														
 
															-      uint32_t ptr = 0;
														
 
															-
														
 
															-      if (inIsGrouped) {
														
 
															-        ptr = theBuilder.createAccessChain(
														
 
															-            ptrType, inBlockVar,
														
 
															-            {theBuilder.getConstantUint32(clipCullIndex), offsetId});
														
 
															-      } else {
														
 
															-        ptr = theBuilder.createAccessChain(
														
 
															-            ptrType, clipCullIndex == 2 ? inClipVar : inCullVar, {offsetId});
														
 
															-      }
														
 
															+      const uint32_t ptr =
														
 
															+          theBuilder.createAccessChain(ptrType, clipCullVar, {offsetId});
														
 
															       return theBuilder.createLoad(f32Type, ptr);
														
 
															     }
														
@@ -570,16 +403,8 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															       for (uint32_t i = 0; i < count; ++i) {
														
 
															         // Read elements sequentially from the float array
														
 
															         const uint32_t offsetId = theBuilder.getConstantUint32(offset + i);
														
 
															-        uint32_t ptr = 0;
														
 
															-
														
 
															-        if (inIsGrouped) {
														
 
															-          ptr = theBuilder.createAccessChain(
														
 
															-              ptrType, inBlockVar,
														
 
															-              {theBuilder.getConstantUint32(clipCullIndex), offsetId});
														
 
															-        } else {
														
 
															-          ptr = theBuilder.createAccessChain(
														
 
															-              ptrType, clipCullIndex == 2 ? inClipVar : inCullVar, {offsetId});
														
 
															-        }
														
 
															+        const uint32_t ptr =
														
 
															+            theBuilder.createAccessChain(ptrType, clipCullVar, {offsetId});
														
 
															         elements.push_back(theBuilder.createLoad(f32Type, ptr));
														
 
															       }
														
 
															       return theBuilder.createCompositeConstruct(
														
@@ -597,8 +422,6 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															   // for indexing into the gl_PerVertex struct, and the third one for reading
														
 
															   // the correct element in the float array for ClipDistance/CullDistance.
														
 
															-  assert(inIsGrouped); // Separated builtins won't have the extra arrayness.
														
 
															-
														
 
															   llvm::SmallVector<uint32_t, 8> arrayElements;
														
 
															   QualType elemType = {};
														
 
															   uint32_t count = {};
														
@@ -609,9 +432,8 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															     arrayType = theBuilder.getArrayType(f32Type, arraySize);
														
 
															     for (uint32_t i = 0; i < inArraySize; ++i) {
														
 
															       const uint32_t ptr = theBuilder.createAccessChain(
														
 
															-          ptrType, inBlockVar,
														
 
															+          ptrType, clipCullVar,
														
 
															           {theBuilder.getConstantUint32(i), // Block array index
														
 
															-           theBuilder.getConstantUint32(clipCullIndex),
														
 
															            theBuilder.getConstantUint32(offset)});
														
 
															       arrayElements.push_back(theBuilder.createLoad(f32Type, ptr));
														
 
															     }
														
@@ -623,9 +445,9 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															       llvm::SmallVector<uint32_t, 4> vecElements;
														
 
															       for (uint32_t j = 0; j < count; ++j) {
														
 
															         const uint32_t ptr = theBuilder.createAccessChain(
														
 
															-            ptrType, inBlockVar,
														
 
															-            {theBuilder.getConstantUint32(i), // Block array index
														
 
															-             theBuilder.getConstantUint32(clipCullIndex),
														
 
															+            ptrType, clipCullVar,
														
 
															+            // Block array index
														
 
															+            {theBuilder.getConstantUint32(i),
														
 
															              // Read elements sequentially from the float array
														
 
															              theBuilder.getConstantUint32(offset + j)});
														
 
															         vecElements.push_back(theBuilder.createLoad(f32Type, ptr));
														
@@ -644,9 +466,6 @@ uint32_t GlPerVertex::readClipCullArrayAsType(bool isClip, uint32_t offset,
 
															 bool GlPerVertex::readField(hlsl::Semantic::Kind semanticKind,
														
 
															                             uint32_t semanticIndex, uint32_t *value) {
														
 
															   switch (semanticKind) {
														
 
															-  case hlsl::Semantic::Kind::Position:
														
 
															-    *value = readPositionOrPointSize(/*isPosition=*/true);
														
 
															-    return true;
														
 
															   case hlsl::Semantic::Kind::ClipDistance: {
														
 
															     const auto offsetIter = inClipOffset.find(semanticIndex);
														
 
															     const auto typeIter = inClipType.find(semanticIndex);
														
@@ -671,62 +490,10 @@ bool GlPerVertex::readField(hlsl::Semantic::Kind semanticKind,
 
															   return false;
														
 
															 }
														
 
															-void GlPerVertex::writePositionOrPointSize(
														
 
															-    bool isPosition, llvm::Optional<uint32_t> invocationId, uint32_t value) {
														
 
															-  // We do not handle stand-alone Position/PointSize builtin here.
														
 
															-  assert(outIsGrouped);
														
 
															-
														
 
															-  // The Position builtin is always of float4 type.
														
 
															-  // The PointSize builtin is always of float type.
														
 
															-  const uint32_t f32Type = theBuilder.getFloat32Type();
														
 
															-  const uint32_t fieldType =
														
 
															-      isPosition ? theBuilder.getVecType(f32Type, 4) : f32Type;
														
 
															-  const uint32_t ptrType =
														
 
															-      theBuilder.getPointerType(fieldType, spv::StorageClass::Output);
														
 
															-  const uint32_t fieldIndex = theBuilder.getConstantUint32(isPosition ? 0 : 1);
														
 
															-
														
 
															-  if (outArraySize == 0) {
														
 
															-    // The input builtin block is a single block. Only need one index to
														
 
															-    // locate the Position/PointSize builtin.
														
 
															-    const uint32_t ptr =
														
 
															-        theBuilder.createAccessChain(ptrType, outBlockVar, {fieldIndex});
														
 
															-
														
 
															-    if (isPosition && invertY) {
														
 
															-      if (shaderModel.IsVS() || shaderModel.IsDS()) {
														
 
															-        const auto oldY =
														
 
															-            theBuilder.createCompositeExtract(f32Type, value, {1});
														
 
															-        const auto newY =
														
 
															-            theBuilder.createUnaryOp(spv::Op::OpFNegate, f32Type, oldY);
														
 
															-        value = theBuilder.createCompositeInsert(fieldType, value, {1}, newY);
														
 
															-      }
														
 
															-    }
														
 
															-
														
 
															-    theBuilder.createStore(ptr, value);
														
 
															-    return;
														
 
															-  }
														
 
															-
														
 
															-  // Writing to an array only happens in HSCPOut.
														
 
															-  assert(shaderModel.IsHS());
														
 
															-  // And we are only writing to the array element with InvocationId as index.
														
 
															-  assert(invocationId.hasValue());
														
 
															-
														
 
															-  // The input builtin block is an array of blocks, which means we need to
														
 
															-  // to write a float4 to each gl_PerVertex in the array.
														
 
															-
														
 
															-  const uint32_t arrayIndex = invocationId.getValue();
														
 
															-  // Get pointer into the array of structs. We need two indices to locate
														
 
															-  // the Position/PointSize builtin now: the first one is the array index,
														
 
															-  // and the second one is the struct index.
														
 
															-  const uint32_t ptr = theBuilder.createAccessChain(ptrType, outBlockVar,
														
 
															-                                                    {arrayIndex, fieldIndex});
														
 
															-
														
 
															-  theBuilder.createStore(ptr, value);
														
 
															-}
														
 
															-
														
 
															 void GlPerVertex::writeClipCullArrayFromType(
														
 
															     llvm::Optional<uint32_t> invocationId, bool isClip, uint32_t offset,
														
 
															     QualType fromType, uint32_t fromValue) const {
														
 
															-  const uint32_t clipCullIndex = isClip ? 2 : 3;
														
 
															+  const uint32_t clipCullVar = isClip ? outClipVar : outCullVar;
														
 
															   // The ClipDistance/CullDistance is always an float array. We are accessing
														
 
															   // it using pointers, which should be of pointer to float type.
														
@@ -735,25 +502,16 @@ void GlPerVertex::writeClipCullArrayFromType(
 
															       theBuilder.getPointerType(f32Type, spv::StorageClass::Output);
														
 
															   if (outArraySize == 0) {
														
 
															-    // The input builtin block is a single block. Only need two indices to
														
 
															-    // locate the array segment for this SV_ClipDistance/SV_CullDistance
														
 
															-    // variable: one is the index in the gl_PerVertex struct, the other is
														
 
															-    // the start offset within the float array.
														
 
															+    // The output builtin does not have extra arrayness. Only need one index
														
 
															+    // to locate the array segment for this SV_ClipDistance/SV_CullDistance
														
 
															+    // variable: the start offset within the float array.
														
 
															     QualType elemType = {};
														
 
															     uint32_t count = {};
														
 
															     if (TypeTranslator::isScalarType(fromType)) {
														
 
															       const uint32_t offsetId = theBuilder.getConstantUint32(offset);
														
 
															-      uint32_t ptr = 0;
														
 
															-
														
 
															-      if (outIsGrouped) {
														
 
															-        ptr = theBuilder.createAccessChain(
														
 
															-            ptrType, outBlockVar,
														
 
															-            {theBuilder.getConstantUint32(clipCullIndex), offsetId});
														
 
															-      } else {
														
 
															-        ptr = theBuilder.createAccessChain(
														
 
															-            ptrType, clipCullIndex == 2 ? outClipVar : outCullVar, {offsetId});
														
 
															-      }
														
 
															+      const uint32_t ptr =
														
 
															+          theBuilder.createAccessChain(ptrType, clipCullVar, {offsetId});
														
 
															       theBuilder.createStore(ptr, fromValue);
														
 
															       return;
														
 
															     }
														
@@ -764,17 +522,8 @@ void GlPerVertex::writeClipCullArrayFromType(
 
															       for (uint32_t i = 0; i < count; ++i) {
														
 
															         // Write elements sequentially into the float array
														
 
															         const uint32_t offsetId = theBuilder.getConstantUint32(offset + i);
														
 
															-        uint32_t ptr = 0;
														
 
															-
														
 
															-        if (outIsGrouped) {
														
 
															-          ptr = theBuilder.createAccessChain(
														
 
															-              ptrType, outBlockVar,
														
 
															-              {theBuilder.getConstantUint32(clipCullIndex), offsetId});
														
 
															-        } else {
														
 
															-          ptr = theBuilder.createAccessChain(
														
 
															-              ptrType, clipCullIndex == 2 ? outClipVar : outCullVar,
														
 
															-              {offsetId});
														
 
															-        }
														
 
															+        const uint32_t ptr =
														
 
															+            theBuilder.createAccessChain(ptrType, clipCullVar, {offsetId});
														
 
															         const uint32_t subValue =
														
 
															             theBuilder.createCompositeExtract(f32Type, fromValue, {i});
														
 
															         theBuilder.createStore(ptr, subValue);
														
@@ -787,8 +536,6 @@ void GlPerVertex::writeClipCullArrayFromType(
 
															     return;
														
 
															   }
														
 
															-  assert(outIsGrouped); // Separated builtins won't have the extra arrayness.
														
 
															-
														
 
															   // Writing to an array only happens in HSCPOut.
														
 
															   assert(shaderModel.IsHS());
														
 
															   // And we are only writing to the array element with InvocationId as index.
														
@@ -806,11 +553,10 @@ void GlPerVertex::writeClipCullArrayFromType(
 
															   uint32_t count = {};
														
 
															   if (TypeTranslator::isScalarType(fromType)) {
														
 
															-    const uint32_t ptr = theBuilder.createAccessChain(
														
 
															-        ptrType, outBlockVar,
														
 
															-        {arrayIndex, // Block array index
														
 
															-         theBuilder.getConstantUint32(clipCullIndex),
														
 
															-         theBuilder.getConstantUint32(offset)});
														
 
															+    const uint32_t ptr =
														
 
															+        theBuilder.createAccessChain(ptrType, clipCullVar,
														
 
															+                                     {arrayIndex, // Block array index
														
 
															+                                      theBuilder.getConstantUint32(offset)});
														
 
															     theBuilder.createStore(ptr, fromValue);
														
 
															     return;
														
 
															   }
														
@@ -819,9 +565,9 @@ void GlPerVertex::writeClipCullArrayFromType(
 
															     // For each gl_PerVertex block, we need to write a vector into it.
														
 
															     for (uint32_t i = 0; i < count; ++i) {
														
 
															       const uint32_t ptr = theBuilder.createAccessChain(
														
 
															-          ptrType, outBlockVar,
														
 
															-          {arrayIndex, // Block array index
														
 
															-           theBuilder.getConstantUint32(clipCullIndex),
														
 
															+          ptrType, clipCullVar,
														
 
															+          // Block array index
														
 
															+          {arrayIndex,
														
 
															            // Write elements sequentially into the float array
														
 
															            theBuilder.getConstantUint32(offset + i)});
														
 
															       const uint32_t subValue =
														
@@ -855,9 +601,6 @@ bool GlPerVertex::writeField(hlsl::Semantic::Kind semanticKind,
 
															   // The interesting shader stage is HS. We need the InvocationID to write
														
 
															   // out the value to the correct array element.
														
 
															   switch (semanticKind) {
														
 
															-  case hlsl::Semantic::Kind::Position:
														
 
															-    writePositionOrPointSize(/*isPosition=*/true, invocationId, *value);
														
 
															-    return true;
														
 
															   case hlsl::Semantic::Kind::ClipDistance: {
														
 
															     const auto offsetIter = outClipOffset.find(semanticIndex);
														
 
															     const auto typeIter = outClipType.find(semanticIndex);
														
--- a/tools/clang/lib/SPIRV/GlPerVertex.h
+++ b/tools/clang/lib/SPIRV/GlPerVertex.h
@@ -23,20 +23,8 @@
 
															 namespace clang {
														
 
															 namespace spirv {
														
 
															-/// The class for representing special gl_PerVertex builtin interface block.
														
 
															-/// The Position, PointSize, ClipDistance, and CullDistance builtin should
														
 
															-/// be handled by this class, except for
														
 
															-/// * Position builtin used in GS output and PS input,
														
 
															-/// * PointSize builtin used in GS output.
														
 
															-///
														
 
															-/// Although the Vulkan spec does not require this directly, it seems the only
														
 
															-/// way to avoid violating the spec is to group the Position, ClipDistance, and
														
 
															-/// CullDistance builtins together into a struct. That's also how GLSL handles
														
 
															-/// these builtins. In GLSL, this struct is called gl_PerVertex.
														
 
															-///
														
 
															-/// This struct should appear as the entry point parameters but it should not
														
 
															-/// have location assignment. We can have two such blocks at most: one for
														
 
															-/// input, one for output.
														
 
															+/// The class for handling ClipDistance and CullDistance builtin variables that
														
 
															+/// belong to gl_PerVertex.
														
 
															 ///
														
 
															 /// Reading/writing of the ClipDistance/CullDistance builtin is not as
														
 
															 /// straightforward as other builtins. This is because in HLSL, we can have
														
@@ -57,19 +45,18 @@ namespace spirv {
 
															 class GlPerVertex {
														
 
															 public:
														
 
															   GlPerVertex(const hlsl::ShaderModel &sm, ASTContext &context,
														
 
															-              ModuleBuilder &builder, TypeTranslator &translator, bool negateY);
														
 
															+              ModuleBuilder &builder, TypeTranslator &translator);
														
 
															   /// Records a declaration of SV_ClipDistance/SV_CullDistance so later
														
 
															   /// we can caculate the ClipDistance/CullDistance array layout.
														
 
															-  /// Also records the semantic strings provided for the builtins in
														
 
															-  /// gl_PerVertex.
														
 
															+  /// Also records the semantic strings provided for them.
														
 
															   bool recordGlPerVertexDeclFacts(const DeclaratorDecl *decl, bool asInput);
														
 
															   /// Calculates the layout for ClipDistance/CullDistance arrays.
														
 
															   void calculateClipCullDistanceArraySize();
														
 
															-  /// Emits SPIR-V code for the input and/or ouput gl_PerVertex builtin
														
 
															-  /// interface blocks. If inputArrayLength is not zero, the input gl_PerVertex
														
 
															+  /// Emits SPIR-V code for the input and/or ouput ClipDistance/CullDistance
														
 
															+  /// builtin variables. If inputArrayLength is not zero, the input variable
														
 
															   /// will have an additional arrayness of the given size. Similarly for
														
 
															   /// outputArrayLength.
														
 
															   ///
														
@@ -78,9 +65,9 @@ public:
 
															   void generateVars(uint32_t inputArrayLength, uint32_t outputArrayLength);
														
 
															   /// Returns the <result-id>s for stage input variables.
														
 
															-  llvm::SmallVector<uint32_t, 4> getStageInVars() const;
														
 
															+  llvm::SmallVector<uint32_t, 2> getStageInVars() const;
														
 
															   /// Returns the <result-id>s for stage output variables.
														
 
															-  llvm::SmallVector<uint32_t, 4> getStageOutVars() const;
														
 
															+  llvm::SmallVector<uint32_t, 2> getStageOutVars() const;
														
 
															   /// Requires the ClipDistance/CullDistance capability if we've seen
														
 
															   /// definition of SV_ClipDistance/SV_CullDistance.
														
@@ -98,17 +85,12 @@ public:
 
															   /// accesses the element at the invocation offset in the gl_PerVeterx array.
														
 
															   ///
														
 
															   /// Emits SPIR-V instructions and returns true if we are accessing builtins
														
 
															-  /// belonging to gl_PerVertex. Does nothing and returns true if we are
														
 
															-  /// accessing builtins not in gl_PerVertex. Returns false if errors occurs.
														
 
															+  /// that are ClipDistance or CullDistance. Does nothing and returns true if
														
 
															+  /// accessing builtins for others. Returns false if errors occurs.
														
 
															   bool tryToAccess(hlsl::SigPoint::Kind sigPoint, hlsl::Semantic::Kind,
														
 
															                    uint32_t semanticIndex, llvm::Optional<uint32_t> invocation,
														
 
															                    uint32_t *value, bool noWriteBack);
														
 
															-  /// Similar to tryToAccess, but only used for the PointSize builtin.
														
 
															-  bool tryToAccessPointSize(hlsl::SigPoint::Kind sigPoint,
														
 
															-                            llvm::Optional<uint32_t> invocation,
														
 
															-                            uint32_t *value, bool noWriteBack);
														
 
															-
														
 
															 private:
														
 
															   template <unsigned N>
														
 
															   DiagnosticBuilder emitError(const char (&message)[N], SourceLocation loc) {
														
@@ -117,19 +99,10 @@ private:
 
															     return astContext.getDiagnostics().Report(loc, diagId);
														
 
															   }
														
 
															-  /// Creates a gl_PerVertex interface block variable. If arraySize is not zero,
														
 
															-  /// The created variable will be an array of gl_PerVertex of the given size.
														
 
															-  /// Otherwise, it will just be a plain struct.
														
 
															-  uint32_t createBlockVar(bool asInput, uint32_t arraySize);
														
 
															-  /// Creates a stand-alone Position builtin variable.
														
 
															-  uint32_t createPositionVar(bool asInput);
														
 
															-  /// Creates a stand-alone ClipDistance builtin variable.
														
 
															-  uint32_t createClipDistanceVar(bool asInput, uint32_t arraySize);
														
 
															-  /// Creates a stand-alone CullDistance builtin variable.
														
 
															-  uint32_t createCullDistanceVar(bool asInput, uint32_t arraySize);
														
 
															-
														
 
															-  /// Emits SPIR-V instructions for reading the Position/PointSize builtin.
														
 
															-  uint32_t readPositionOrPointSize(bool isPosition) const;
														
 
															+  /// Creates a stand-alone ClipDistance/CullDistance builtin variable.
														
 
															+  uint32_t createClipCullDistanceVar(bool asInput, bool isClip,
														
 
															+                                     uint32_t arraySize);
														
 
															+
														
 
															   /// Emits SPIR-V instructions for reading the data starting from offset in
														
 
															   /// the ClipDistance/CullDistance builtin. The data read will be transformed
														
 
															   /// into the given type asType.
														
@@ -139,10 +112,6 @@ private:
 
															   bool readField(hlsl::Semantic::Kind semanticKind, uint32_t semanticIndex,
														
 
															                  uint32_t *value);
														
 
															-  /// Emits SPIR-V instructions for writing the Position/PointSize builtin.
														
 
															-  void writePositionOrPointSize(bool isPosition,
														
 
															-                                llvm::Optional<uint32_t> invocationId,
														
 
															-                                uint32_t value);
														
 
															   /// Emits SPIR-V instructions for writing data into the ClipDistance/
														
 
															   /// CullDistance builtin starting from offset. The value to be written is
														
 
															   /// fromValue, whose type is fromType. Necessary transformations will be
														
@@ -167,41 +136,14 @@ private:
 
															   ModuleBuilder &theBuilder;
														
 
															   TypeTranslator &typeTranslator;
														
 
															-  /// Indicates whether to invert SV_Position.y to accommodate Vulkan's
														
 
															-  /// coordinate system
														
 
															-  bool invertY;
														
 
															-
														
 
															-  /// We can have Position, ClipDistance, and CullDistance either grouped (G)
														
 
															-  /// into the gl_PerVertex struct, or separated (S) as stand-alone variables.
														
 
															-  /// The following table shows for each shader stage, which one is used:
														
 
															-  ///
														
 
															-  /// ===== ===== ======
														
 
															-  /// Stage Input Output
														
 
															-  /// ===== ===== ======
														
 
															-  ///  VS     X     G
														
 
															-  ///  HS     G     G
														
 
															-  ///  DS     G     G
														
 
															-  ///  GS     G     S
														
 
															-  ///  PS     S     X
														
 
															-  /// ===== ===== ======
														
 
															-  ///
														
 
															-  /// Note that when we use separated variables, there is no extra arrayness.
														
 
															-  ///
														
 
															-  /// So depending on the shader stage, we may use one of the following set
														
 
															-  /// of variables to store <result-id>s of the variables:
														
 
															-
														
 
															-  /// Indicates which set of variables are used.
														
 
															-  bool inIsGrouped, outIsGrouped;
														
 
															-  /// Input/output gl_PerVertex block variable if grouped.
														
 
															-  uint32_t inBlockVar, outBlockVar;
														
 
															-  /// Input/output ClipDistance/CullDistance variable if separated.
														
 
															+  /// Input/output ClipDistance/CullDistance variable.
														
 
															   uint32_t inClipVar, inCullVar;
														
 
															   uint32_t outClipVar, outCullVar;
														
 
															-  /// The array size for the input/output gl_PerVertex block variabe.
														
 
															+  /// The array size for the input/output gl_PerVertex block member variables.
														
 
															   /// HS input and output, DS input, GS input has an additional level of
														
 
															   /// arrayness. The array size is stored in this variable. Zero means
														
 
															-  /// the corresponding variable is a plain struct, not an array.
														
 
															+  /// the corresponding variable does not need extra arrayness.
														
 
															   uint32_t inArraySize, outArraySize;
														
 
															   /// The array size of input/output ClipDistance/CullDistance float arrays.
														
 
															   /// This is not the array size of the whole gl_PerVertex struct.
														
@@ -218,10 +160,12 @@ private:
 
															   SemanticIndexToArrayOffsetMap inClipOffset, outClipOffset;
														
 
															   SemanticIndexToArrayOffsetMap inCullOffset, outCullOffset;
														
 
															+  enum { kSemanticStrCount = 2 };
														
 
															+
														
 
															   /// Keeps track of the semantic strings provided in the source code for the
														
 
															   /// builtins in gl_PerVertex.
														
 
															-  llvm::SmallVector<std::string, 4> inSemanticStrs;
														
 
															-  llvm::SmallVector<std::string, 4> outSemanticStrs;
														
 
															+  llvm::SmallVector<std::string, kSemanticStrCount> inSemanticStrs;
														
 
															+  llvm::SmallVector<std::string, kSemanticStrCount> outSemanticStrs;
														
 
															 };
														
 
															 } // end namespace spirv
														
--- a/tools/clang/lib/SPIRV/ModuleBuilder.cpp
+++ b/tools/clang/lib/SPIRV/ModuleBuilder.cpp
@@ -13,7 +13,6 @@
 
															 #include "spirv/unified1//spirv.hpp11"
														
 
															 #include "clang/SPIRV/BitwiseCast.h"
														
 
															 #include "clang/SPIRV/InstBuilder.h"
														
 
															-#include "llvm/llvm_assert/assert.h"
														
 
															 namespace clang {
														
 
															 namespace spirv {
														
@@ -400,6 +399,7 @@ spv::ImageOperandsMask ModuleBuilder::composeImageOperandsMask(
 
															   if (constOffsets) {
														
 
															     mask = mask | ImageOperandsMask::ConstOffsets;
														
 
															+    requireCapability(spv::Capability::ImageGatherExtended);
														
 
															     orderedParams->push_back(constOffsets);
														
 
															   }
														
@@ -442,8 +442,8 @@ uint32_t ModuleBuilder::createImageTexelPointer(uint32_t resultType,
 
															 uint32_t ModuleBuilder::createImageSample(
														
 
															     uint32_t texelType, uint32_t imageType, uint32_t image, uint32_t sampler,
														
 
															-    uint32_t coordinate, uint32_t compareVal, uint32_t bias, uint32_t lod,
														
 
															-    std::pair<uint32_t, uint32_t> grad, uint32_t constOffset,
														
 
															+    bool isNonUniform, uint32_t coordinate, uint32_t compareVal, uint32_t bias,
														
 
															+    uint32_t lod, std::pair<uint32_t, uint32_t> grad, uint32_t constOffset,
														
 
															     uint32_t varOffset, uint32_t constOffsets, uint32_t sample, uint32_t minLod,
														
 
															     uint32_t residencyCodeId) {
														
 
															   assert(insertPoint && "null insert point");
														
@@ -470,6 +470,12 @@ uint32_t ModuleBuilder::createImageSample(
 
															   instBuilder.opSampledImage(sampledImgTy, sampledImgId, image, sampler).x();
														
 
															   insertPoint->appendInstruction(std::move(constructSite));
														
 
															+  if (isNonUniform) {
														
 
															+    // The sampled image will be used to access resource's memory, so we need
														
 
															+    // to decorate it with NonUniformEXT.
														
 
															+    decorate(sampledImgId, spv::Decoration::NonUniformEXT);
														
 
															+  }
														
 
															+
														
 
															   uint32_t texelId = theContext.takeNextId();
														
 
															   llvm::SmallVector<uint32_t, 4> params;
														
 
															   const auto mask =
														
@@ -550,9 +556,9 @@ uint32_t ModuleBuilder::createImageFetchOrRead(
 
															 uint32_t ModuleBuilder::createImageGather(
														
 
															     uint32_t texelType, uint32_t imageType, uint32_t image, uint32_t sampler,
														
 
															-    uint32_t coordinate, uint32_t component, uint32_t compareVal,
														
 
															-    uint32_t constOffset, uint32_t varOffset, uint32_t constOffsets,
														
 
															-    uint32_t sample, uint32_t residencyCodeId) {
														
 
															+    bool isNonUniform, uint32_t coordinate, uint32_t component,
														
 
															+    uint32_t compareVal, uint32_t constOffset, uint32_t varOffset,
														
 
															+    uint32_t constOffsets, uint32_t sample, uint32_t residencyCodeId) {
														
 
															   assert(insertPoint && "null insert point");
														
 
															   uint32_t sparseRetType = 0;
														
@@ -567,6 +573,12 @@ uint32_t ModuleBuilder::createImageGather(
 
															   instBuilder.opSampledImage(sampledImgTy, sampledImgId, image, sampler).x();
														
 
															   insertPoint->appendInstruction(std::move(constructSite));
														
 
															+  if (isNonUniform) {
														
 
															+    // The sampled image will be used to access resource's memory, so we need
														
 
															+    // to decorate it with NonUniformEXT.
														
 
															+    decorate(sampledImgId, spv::Decoration::NonUniformEXT);
														
 
															+  }
														
 
															+
														
 
															   llvm::SmallVector<uint32_t, 2> params;
														
 
															   // TODO: Update ImageGather to accept minLod if necessary.
														
@@ -859,6 +871,11 @@ void ModuleBuilder::decorateLocation(uint32_t targetId, uint32_t location) {
 
															   theModule.addDecoration(d, targetId);
														
 
															 }
														
 
															+void ModuleBuilder::decorateIndex(uint32_t targetId, uint32_t index) {
														
 
															+  const Decoration *d = Decoration::getIndex(theContext, index);
														
 
															+  theModule.addDecoration(d, targetId);
														
 
															+}
														
 
															+
														
 
															 void ModuleBuilder::decorateSpecId(uint32_t targetId, uint32_t specId) {
														
 
															   const Decoration *d = Decoration::getSpecId(theContext, specId);
														
 
															   theModule.addDecoration(d, targetId);
														
@@ -888,6 +905,9 @@ void ModuleBuilder::decorate(uint32_t targetId, spv::Decoration decoration) {
 
															   case spv::Decoration::Patch:
														
 
															     d = Decoration::getPatch(theContext);
														
 
															     break;
														
 
															+  case spv::Decoration::NonUniformEXT:
														
 
															+    d = Decoration::getNonUniformEXT(theContext);
														
 
															+    break;
														
 
															   }
														
 
															   assert(d && "unimplemented decoration");
														
--- a/tools/clang/lib/SPIRV/SPIRVContext.cpp
+++ b/tools/clang/lib/SPIRV/SPIRVContext.cpp
@@ -10,7 +10,6 @@
 
															 #include <tuple>
														
 
															 #include "clang/SPIRV/SPIRVContext.h"
														
 
															-#include "llvm/llvm_assert/assert.h"
														
 
															 namespace clang {
														
 
															 namespace spirv {
														
--- a/tools/clang/lib/SPIRV/SPIRVEmitter.cpp
+++ b/tools/clang/lib/SPIRV/SPIRVEmitter.cpp
@@ -163,8 +163,9 @@ inline bool isExternalVar(const VarDecl *var) {
 
															   // groupshared variables are allowed to be declared as "static". But we still
														
 
															   // need to put them in the Workgroup storage class. That is, when seeing
														
 
															   // "static groupshared", ignore "static".
														
 
															-  return var->hasExternalFormalLinkage() ? !var->isStaticDataMember()
														
 
															-                                         : var->getAttr<HLSLGroupSharedAttr>();
														
 
															+  return var->hasExternalFormalLinkage()
														
 
															+             ? !var->isStaticDataMember()
														
 
															+             : (var->getAttr<HLSLGroupSharedAttr>() != nullptr);
														
 
															 }
														
 
															 /// Returns the referenced variable's DeclContext if the given expr is
														
@@ -181,9 +182,11 @@ const DeclContext *isConstantTextureBufferDeclRef(const Expr *expr) {
 
															 /// Returns true if
														
 
															 /// * the given expr is an DeclRefExpr referencing a kind of structured or byte
														
 
															-/// buffer and it is non-alias one, or
														
 
															+///   buffer and it is non-alias one, or
														
 
															 /// * the given expr is an CallExpr returning a kind of structured or byte
														
 
															-/// buffer.
														
 
															+///   buffer.
														
 
															+/// * the given expr is an ArraySubscriptExpr referencing a kind of structured
														
 
															+///   or byte buffer.
														
 
															 ///
														
 
															 /// Note: legalization specific code
														
 
															 bool isReferencingNonAliasStructuredOrByteBuffer(const Expr *expr) {
														
@@ -195,6 +198,8 @@ bool isReferencingNonAliasStructuredOrByteBuffer(const Expr *expr) {
 
															   } else if (const auto *callExpr = dyn_cast<CallExpr>(expr)) {
														
 
															     if (TypeTranslator::isAKindOfStructuredOrByteBuffer(callExpr->getType()))
														
 
															       return true;
														
 
															+  } else if (const auto *arrSubExpr = dyn_cast<ArraySubscriptExpr>(expr)) {
														
 
															+    return isReferencingNonAliasStructuredOrByteBuffer(arrSubExpr->getBase());
														
 
															   }
														
 
															   return false;
														
 
															 }
														
@@ -533,6 +538,37 @@ std::string getFnName(const FunctionDecl *fn) {
 
															   return getNamespacePrefix(fn) + classOrStructName + fn->getName().str();
														
 
															 }
														
 
															+/// Returns the capability required to non-uniformly index into the given type.
														
 
															+spv::Capability getNonUniformCapability(QualType type) {
														
 
															+  using spv::Capability;
														
 
															+
														
 
															+  if (type->isArrayType()) {
														
 
															+    return getNonUniformCapability(
														
 
															+        type->getAsArrayTypeUnsafe()->getElementType());
														
 
															+  }
														
 
															+  if (TypeTranslator::isTexture(type) || TypeTranslator::isSampler(type)) {
														
 
															+    return Capability::SampledImageArrayNonUniformIndexingEXT;
														
 
															+  }
														
 
															+  if (TypeTranslator::isRWTexture(type)) {
														
 
															+    return Capability::StorageImageArrayNonUniformIndexingEXT;
														
 
															+  }
														
 
															+  if (TypeTranslator::isBuffer(type)) {
														
 
															+    return Capability::UniformTexelBufferArrayNonUniformIndexingEXT;
														
 
															+  }
														
 
															+  if (TypeTranslator::isRWBuffer(type)) {
														
 
															+    return Capability::StorageTexelBufferArrayNonUniformIndexingEXT;
														
 
															+  }
														
 
															+  if (const auto *recordType = type->getAs<RecordType>()) {
														
 
															+    const auto name = recordType->getDecl()->getName();
														
 
															+
														
 
															+    if (name == "SubpassInput" || name == "SubpassInputMS") {
														
 
															+      return Capability::InputAttachmentArrayNonUniformIndexingEXT;
														
 
															+    }
														
 
															+  }
														
 
															+
														
 
															+  return Capability::Max;
														
 
															+}
														
 
															+
														
 
															 } // namespace
														
 
															 SPIRVEmitter::SPIRVEmitter(CompilerInstance &ci, EmitSPIRVOptions &options)
														
@@ -548,7 +584,7 @@ SPIRVEmitter::SPIRVEmitter(CompilerInstance &ci, EmitSPIRVOptions &options)
 
															                    featureManager, options),
														
 
															       entryFunctionId(0), curFunction(nullptr), curThis(0),
														
 
															       seenPushConstantAt(), isSpecConstantMode(false),
														
 
															-      needsLegalization(false) {
														
 
															+      foundNonUniformResourceIndex(false), needsLegalization(false) {
														
 
															   if (shaderModel.GetKind() == hlsl::ShaderModel::Kind::Invalid)
														
 
															     emitError("unknown shader module: %0", {}) << shaderModel.GetName();
														
@@ -587,11 +623,7 @@ void SPIRVEmitter::HandleTranslationUnit(ASTContext &context) {
 
															         workQueue.insert(funcDecl);
														
 
															       }
														
 
															     } else {
														
 
															-      // If ignoring unused resources, defer Decl handling inside
														
 
															-      // TranslationUnit to the time of first referencing.
														
 
															-      if (!spirvOptions.ignoreUnusedResources) {
														
 
															-        doDecl(decl);
														
 
															-      }
														
 
															+      doDecl(decl);
														
 
															     }
														
 
															   }
														
@@ -749,21 +781,6 @@ void SPIRVEmitter::doStmt(const Stmt *stmt,
 
															   }
														
 
															 }
														
 
															-SpirvEvalInfo SPIRVEmitter::doDeclRefExpr(const DeclRefExpr *expr) {
														
 
															-  const auto *decl = expr->getDecl();
														
 
															-  auto id = declIdMapper.getDeclEvalInfo(decl, false);
														
 
															-
														
 
															-  if (spirvOptions.ignoreUnusedResources && !id) {
														
 
															-    // First time referencing a Decl inside TranslationUnit. Register
														
 
															-    // into DeclResultIdMapper and emit SPIR-V for it and then query
														
 
															-    // again.
														
 
															-    doDecl(decl);
														
 
															-    id = declIdMapper.getDeclEvalInfo(decl);
														
 
															-  }
														
 
															-
														
 
															-  return id;
														
 
															-}
														
 
															-
														
 
															 SpirvEvalInfo SPIRVEmitter::doExpr(const Expr *expr) {
														
 
															   SpirvEvalInfo result(/*id*/ 0);
														
@@ -774,7 +791,7 @@ SpirvEvalInfo SPIRVEmitter::doExpr(const Expr *expr) {
 
															   expr = expr->IgnoreParens();
														
 
															   if (const auto *declRefExpr = dyn_cast<DeclRefExpr>(expr)) {
														
 
															-    result = doDeclRefExpr(declRefExpr);
														
 
															+    result = declIdMapper.getDeclEvalInfo(declRefExpr->getDecl());
														
 
															   } else if (const auto *memberExpr = dyn_cast<MemberExpr>(expr)) {
														
 
															     result = doMemberExpr(memberExpr);
														
 
															   } else if (const auto *castExpr = dyn_cast<CastExpr>(expr)) {
														
@@ -879,6 +896,12 @@ SpirvEvalInfo SPIRVEmitter::loadIfGLValue(const Expr *expr,
 
															   uint32_t loadedId = theBuilder.createLoad(valType, info);
														
 
															+  // Decorate with NonUniformEXT if loading from a pointer with that property.
														
 
															+  // We are likely loading an element from the resource array here.
														
 
															+  if (info.isNonUniform()) {
														
 
															+    theBuilder.decorate(loadedId, spv::Decoration::NonUniformEXT);
														
 
															+  }
														
 
															+
														
 
															   // Special-case: According to the SPIR-V Spec: There is no physical size or
														
 
															   // bit pattern defined for boolean type. Therefore an unsigned integer is used
														
 
															   // to represent booleans when layout is required. In such cases, after loading
														
@@ -1190,11 +1213,13 @@ void SPIRVEmitter::doHLSLBufferDecl(const HLSLBufferDecl *bufferDecl) {
 
															   // supported in Vulkan
														
 
															   for (const auto *member : bufferDecl->decls()) {
														
 
															     if (const auto *varMember = dyn_cast<VarDecl>(member)) {
														
 
															-      if (const auto *init = varMember->getInit())
														
 
															-        emitWarning("%select{tbuffer|cbuffer}0 member initializer "
														
 
															-                    "ignored since no Vulkan equivalent",
														
 
															-                    init->getExprLoc())
														
 
															-            << bufferDecl->isCBuffer() << init->getSourceRange();
														
 
															+      if (!spirvOptions.noWarnIgnoredFeatures) {
														
 
															+        if (const auto *init = varMember->getInit())
														
 
															+          emitWarning("%select{tbuffer|cbuffer}0 member initializer "
														
 
															+                      "ignored since no Vulkan equivalent",
														
 
															+                      init->getExprLoc())
														
 
															+              << bufferDecl->isCBuffer() << init->getSourceRange();
														
 
															+      }
														
 
															       // We cannot handle external initialization of column-major matrices now.
														
 
															       if (typeTranslator.isOrContainsNonFpColMajorMatrix(varMember->getType(),
														
@@ -1240,11 +1265,16 @@ void SPIRVEmitter::doVarDecl(const VarDecl *decl) {
 
															               decl->getLocation());
														
 
															   }
														
 
															-  if (const auto *arrayType =
														
 
															-          astContext.getAsConstantArrayType(decl->getType())) {
														
 
															-    if (TypeTranslator::isAKindOfStructuredOrByteBuffer(
														
 
															-            arrayType->getElementType())) {
														
 
															-      emitError("arrays of structured/byte buffers unsupported",
														
 
															+  // Reject arrays of RW/append/consume structured buffers. They have assoicated
														
 
															+  // counters, which are quite nasty to handle.
														
 
															+  if (decl->getType()->isArrayType()) {
														
 
															+    auto type = decl->getType();
														
 
															+    do {
														
 
															+      type = type->getAsArrayTypeUnsafe()->getElementType();
														
 
															+    } while (type->isArrayType());
														
 
															+
														
 
															+    if (TypeTranslator::isRWAppendConsumeSBuffer(type)) {
														
 
															+      emitError("arrays of RW/append/consume structured buffers unsupported",
														
 
															                 decl->getLocation());
														
 
															       return;
														
 
															     }
														
@@ -1890,8 +1920,20 @@ void SPIRVEmitter::doSwitchStmt(const SwitchStmt *switchStmt,
 
															 SpirvEvalInfo
														
 
															 SPIRVEmitter::doArraySubscriptExpr(const ArraySubscriptExpr *expr) {
														
 
															+  // Make sure we don't have previously unhandled NonUniformResourceIndex()
														
 
															+  assert(!foundNonUniformResourceIndex);
														
 
															+
														
 
															   llvm::SmallVector<uint32_t, 4> indices;
														
 
															-  auto info = loadIfAliasVarRef(collectArrayStructIndices(expr, &indices));
														
 
															+  const auto *base = collectArrayStructIndices(expr, &indices);
														
 
															+  auto info = loadIfAliasVarRef(base);
														
 
															+
														
 
															+  if (foundNonUniformResourceIndex) {
														
 
															+    // Add the necessary capability required for indexing into this kind
														
 
															+    // of resource
														
 
															+    theBuilder.requireCapability(getNonUniformCapability(base->getType()));
														
 
															+    info.setNonUniform(); // Carry forward the NonUniformEXT decoration
														
 
															+    foundNonUniformResourceIndex = false;
														
 
															+  }
														
 
															   if (!indices.empty()) {
														
 
															     (void)turnIntoElementPtr(info, expr->getType(), indices);
														
@@ -1959,7 +2001,8 @@ SpirvEvalInfo SPIRVEmitter::processCall(const CallExpr *callExpr) {
 
															   SpirvEvalInfo objectEvalInfo = 0; // EvalInfo for the object (if exists)
														
 
															   bool needsTempVar = false;        // Whether we need temporary variable.
														
 
															-  llvm::SmallVector<uint32_t, 4> params;    // Temporary variables
														
 
															+  llvm::SmallVector<uint32_t, 4> vars;      // Variables for function call
														
 
															+  llvm::SmallVector<bool, 4> isTempVar;     // Temporary variable or not
														
 
															   llvm::SmallVector<SpirvEvalInfo, 4> args; // Evaluated arguments
														
 
															   if (const auto *memberCall = dyn_cast<CXXMemberCallExpr>(callExpr)) {
														
@@ -1998,7 +2041,8 @@ SpirvEvalInfo SPIRVEmitter::processCall(const CallExpr *callExpr) {
 
															       args.push_back(objectId);
														
 
															       // We do not need to create a new temporary variable for the this
														
 
															       // object. Use the evaluated argument.
														
 
															-      params.push_back(args.back());
														
 
															+      vars.push_back(args.back());
														
 
															+      isTempVar.push_back(false);
														
 
															     }
														
 
															   }
														
@@ -2010,25 +2054,44 @@ SpirvEvalInfo SPIRVEmitter::processCall(const CallExpr *callExpr) {
 
															     auto *arg = callExpr->getArg(i)->IgnoreParenLValueCasts();
														
 
															     const auto *param = callee->getParamDecl(i);
														
 
															-    // We need to create variables for holding the values to be used as
														
 
															-    // arguments. The variables themselves are of pointer types.
														
 
															-    const uint32_t varType =
														
 
															-        declIdMapper.getTypeAndCreateCounterForPotentialAliasVar(param);
														
 
															-    const std::string varName = "param.var." + param->getNameAsString();
														
 
															-    const uint32_t tempVarId = theBuilder.addFnVar(varType, varName);
														
 
															+    // Get the evaluation info if this argument is referencing some variable
														
 
															+    // *as a whole*, in which case we can avoid creating the temporary variable
														
 
															+    // for it if it is Function scope and can act as out parameter.
														
 
															+    SpirvEvalInfo argInfo = 0;
														
 
															+    if (const auto *declRefExpr = dyn_cast<DeclRefExpr>(arg)) {
														
 
															+      argInfo = declIdMapper.getDeclEvalInfo(declRefExpr->getDecl());
														
 
															+    }
														
 
															+
														
 
															+    if (argInfo && argInfo.getStorageClass() == spv::StorageClass::Function &&
														
 
															+        canActAsOutParmVar(param)) {
														
 
															+      vars.push_back(argInfo);
														
 
															+      isTempVar.push_back(false);
														
 
															+      args.push_back(doExpr(arg));
														
 
															+    } else {
														
 
															+      // We need to create variables for holding the values to be used as
														
 
															+      // arguments. The variables themselves are of pointer types.
														
 
															+      const uint32_t varType =
														
 
															+          declIdMapper.getTypeAndCreateCounterForPotentialAliasVar(param);
														
 
															+      const std::string varName = "param.var." + param->getNameAsString();
														
 
															+      const uint32_t tempVarId = theBuilder.addFnVar(varType, varName);
														
 
															-    params.push_back(tempVarId);
														
 
															-    args.push_back(doExpr(arg));
														
 
															+      vars.push_back(tempVarId);
														
 
															+      isTempVar.push_back(true);
														
 
															+      args.push_back(doExpr(arg));
														
 
															-    // Update counter variable associated with function parameters
														
 
															-    tryToAssignCounterVar(param, arg);
														
 
															+      // Update counter variable associated with function parameters
														
 
															+      tryToAssignCounterVar(param, arg);
														
 
															-    // Manually load the argument here
														
 
															-    const auto rhsVal = loadIfGLValue(arg, args.back());
														
 
															-    // Initialize the temporary variables using the contents of the arguments
														
 
															-    storeValue(tempVarId, rhsVal, param->getType());
														
 
															+      // Manually load the argument here
														
 
															+      const auto rhsVal = loadIfGLValue(arg, args.back());
														
 
															+      // Initialize the temporary variables using the contents of the arguments
														
 
															+      storeValue(tempVarId, rhsVal, param->getType());
														
 
															+    }
														
 
															   }
														
 
															+  assert(vars.size() == isTempVar.size());
														
 
															+  assert(vars.size() == args.size());
														
 
															+
														
 
															   // Push the callee into the work queue if it is not there.
														
 
															   if (!workQueue.count(callee)) {
														
 
															     workQueue.insert(callee);
														
@@ -2039,26 +2102,25 @@ SpirvEvalInfo SPIRVEmitter::processCall(const CallExpr *callExpr) {
 
															   // Get or forward declare the function <result-id>
														
 
															   const uint32_t funcId = declIdMapper.getOrRegisterFnResultId(callee);
														
 
															-  const uint32_t retVal =
														
 
															-      theBuilder.createFunctionCall(retType, funcId, params);
														
 
															+  const uint32_t retVal = theBuilder.createFunctionCall(retType, funcId, vars);
														
 
															   // If we created a temporary variable for the lvalue object this method is
														
 
															   // invoked upon, we need to copy the contents in the temporary variable back
														
 
															   // to the original object's variable in case there are side effects.
														
 
															   if (needsTempVar && !objectEvalInfo.isRValue()) {
														
 
															     const uint32_t typeId = typeTranslator.translateType(objectType);
														
 
															-    const uint32_t value = theBuilder.createLoad(typeId, params.front());
														
 
															+    const uint32_t value = theBuilder.createLoad(typeId, vars.front());
														
 
															     storeValue(objectEvalInfo, value, objectType);
														
 
															   }
														
 
															   // Go through all parameters and write those marked as out/inout
														
 
															   for (uint32_t i = 0; i < numParams; ++i) {
														
 
															     const auto *param = callee->getParamDecl(i);
														
 
															-    if (canActAsOutParmVar(param)) {
														
 
															+    if (isTempVar[i] && canActAsOutParmVar(param)) {
														
 
															       const auto *arg = callExpr->getArg(i);
														
 
															       const uint32_t index = i + isNonStaticMemberCall;
														
 
															       const uint32_t typeId = typeTranslator.translateType(param->getType());
														
 
															-      const uint32_t value = theBuilder.createLoad(typeId, params[index]);
														
 
															+      const uint32_t value = theBuilder.createLoad(typeId, vars[index]);
														
 
															       processAssignment(arg, value, false, args[index]);
														
 
															     }
														
@@ -2717,7 +2779,9 @@ uint32_t SPIRVEmitter::processGetSamplePosition(const CXXMemberCallExpr *expr) {
 
															 SpirvEvalInfo SPIRVEmitter::processSubpassLoad(const CXXMemberCallExpr *expr) {
														
 
															   const auto *object = expr->getImplicitObjectArgument()->IgnoreParens();
														
 
															-  const uint32_t sample = expr->getNumArgs() == 1 ? doExpr(expr->getArg(0)) : 0;
														
 
															+  const uint32_t sample = expr->getNumArgs() == 1
														
 
															+                              ? static_cast<uint32_t>(doExpr(expr->getArg(0)))
														
 
															+                              : 0;
														
 
															   const uint32_t zero = theBuilder.getConstantInt32(0);
														
 
															   const uint32_t location = theBuilder.getConstantComposite(
														
 
															       theBuilder.getVecType(theBuilder.getInt32Type(), 2), {zero, zero});
														
@@ -2779,16 +2843,10 @@ SPIRVEmitter::processBufferTextureGetDimensions(const CXXMemberCallExpr *expr) {
 
															   // The HLSL methods, however, have overloaded functions which have float
														
 
															   // output arguments. Since the AST naturally won't have casting AST nodes for
														
 
															   // such cases, we'll have to perform the cast ourselves.
														
 
															-  const auto storeToOutputArg = [this](const Expr *outputArg,
														
 
															-                                       uint32_t toStoreId) {
														
 
															-    const auto outputArgType = outputArg->getType();
														
 
															-    // Perform cast to float if necessary.
														
 
															-    if (isFloatOrVecMatOfFloatType(outputArgType)) {
														
 
															-      toStoreId = theBuilder.createUnaryOp(
														
 
															-          spv::Op::OpConvertUToF, typeTranslator.translateType(outputArgType),
														
 
															-          toStoreId);
														
 
															-    }
														
 
															-    theBuilder.createStore(doExpr(outputArg), toStoreId);
														
 
															+  const auto storeToOutputArg = [this](const Expr *outputArg, uint32_t id,
														
 
															+                                       QualType type) {
														
 
															+    id = castToType(id, type, outputArg->getType(), outputArg->getExprLoc());
														
 
															+    theBuilder.createStore(doExpr(outputArg), id);
														
 
															   };
														
 
															   if ((typeName == "Texture1D" && numArgs > 1) ||
														
@@ -2815,8 +2873,11 @@ SPIRVEmitter::processBufferTextureGetDimensions(const CXXMemberCallExpr *expr) {
 
															     querySize -= 1;
														
 
															   const uint32_t uintId = theBuilder.getUint32Type();
														
 
															-  const uint32_t resultTypeId =
														
 
															-      querySize == 1 ? uintId : theBuilder.getVecType(uintId, querySize);
														
 
															+  const QualType resultQualType =
														
 
															+      querySize == 1
														
 
															+          ? astContext.UnsignedIntTy
														
 
															+          : astContext.getExtVectorType(astContext.UnsignedIntTy, querySize);
														
 
															+  const uint32_t resultTypeId = typeTranslator.translateType(resultQualType);
														
 
															   // Only Texture types use ImageQuerySizeLod.
														
 
															   // TextureMS, RWTexture, Buffers, RWBuffers use ImageQuerySize.
														
@@ -2839,7 +2900,7 @@ SPIRVEmitter::processBufferTextureGetDimensions(const CXXMemberCallExpr *expr) {
 
															   if (querySize == 1) {
														
 
															     const uint32_t argIndex = mipLevel ? 1 : 0;
														
 
															-    storeToOutputArg(expr->getArg(argIndex), query);
														
 
															+    storeToOutputArg(expr->getArg(argIndex), query, resultQualType);
														
 
															   } else {
														
 
															     for (uint32_t i = 0; i < querySize; ++i) {
														
 
															       const uint32_t component =
														
@@ -2847,7 +2908,8 @@ SPIRVEmitter::processBufferTextureGetDimensions(const CXXMemberCallExpr *expr) {
 
															       // If the first arg is the mipmap level, we must write the results
														
 
															       // starting from Arg(i+1), not Arg(i).
														
 
															       const uint32_t argIndex = mipLevel ? i + 1 : i;
														
 
															-      storeToOutputArg(expr->getArg(argIndex), component);
														
 
															+      storeToOutputArg(expr->getArg(argIndex), component,
														
 
															+                       astContext.UnsignedIntTy);
														
 
															     }
														
 
															   }
														
@@ -2857,7 +2919,8 @@ SPIRVEmitter::processBufferTextureGetDimensions(const CXXMemberCallExpr *expr) {
 
															         numLevels ? spv::Op::OpImageQueryLevels : spv::Op::OpImageQuerySamples;
														
 
															     const uint32_t numLevelsSamplesQuery =
														
 
															         theBuilder.createUnaryOp(opcode, uintId, objectId);
														
 
															-    storeToOutputArg(numLevelsSamplesArg, numLevelsSamplesQuery);
														
 
															+    storeToOutputArg(numLevelsSamplesArg, numLevelsSamplesQuery,
														
 
															+                     astContext.UnsignedIntTy);
														
 
															   }
														
 
															   return 0;
														
@@ -2873,13 +2936,19 @@ SPIRVEmitter::processTextureLevelOfDetail(const CXXMemberCallExpr *expr) {
 
															   // Return type is always a single float (LOD).
														
 
															   assert(expr->getNumArgs() == 2u);
														
 
															   const auto *object = expr->getImplicitObjectArgument();
														
 
															-  const uint32_t objectId = loadIfGLValue(object);
														
 
															-  const uint32_t samplerState = doExpr(expr->getArg(0));
														
 
															+  const auto objectInfo = loadIfGLValue(object);
														
 
															+  const auto samplerState = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   const uint32_t sampledImageType = theBuilder.getSampledImageType(
														
 
															       typeTranslator.translateType(object->getType()));
														
 
															   const uint32_t sampledImage = theBuilder.createBinaryOp(
														
 
															-      spv::Op::OpSampledImage, sampledImageType, objectId, samplerState);
														
 
															+      spv::Op::OpSampledImage, sampledImageType, objectInfo, samplerState);
														
 
															+
														
 
															+  if (objectInfo.isNonUniform() || samplerState.isNonUniform()) {
														
 
															+    // The sampled image will be used to access resource's memory, so we need
														
 
															+    // to decorate it with NonUniformEXT.
														
 
															+    theBuilder.decorate(sampledImage, spv::Decoration::NonUniformEXT);
														
 
															+  }
														
 
															   // The result type of OpImageQueryLod must be a float2.
														
 
															   const uint32_t queryResultType =
														
@@ -2933,10 +3002,11 @@ uint32_t SPIRVEmitter::processTextureGatherRGBACmpRGBA(
 
															   // No offset args for TextureCube, 1 or 4 offset args for the rest.
														
 
															   assert(numOffsetArgs == 0 || numOffsetArgs == 1 || numOffsetArgs == 4);
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															-  const uint32_t compareVal = isCmp ? doExpr(expr->getArg(2)) : 0;
														
 
															+  const uint32_t compareVal =
														
 
															+      isCmp ? static_cast<uint32_t>(doExpr(expr->getArg(2))) : 0;
														
 
															   // Handle offsets (if any).
														
 
															   bool needsEmulation = false;
														
@@ -2965,7 +3035,10 @@ uint32_t SPIRVEmitter::processTextureGatherRGBACmpRGBA(
 
															     }
														
 
															   }
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															+  const bool isNonUniform = image.isNonUniform() || sampler.isNonUniform();
														
 
															   if (needsEmulation) {
														
 
															     const auto elemType = typeTranslator.translateType(
														
@@ -2975,7 +3048,7 @@ uint32_t SPIRVEmitter::processTextureGatherRGBACmpRGBA(
 
															     for (uint32_t i = 0; i < 4; ++i) {
														
 
															       varOffset = doExpr(expr->getArg(2 + isCmp + i));
														
 
															       const uint32_t gatherRet = theBuilder.createImageGather(
														
 
															-          retTypeId, imageTypeId, image, sampler, coordinate,
														
 
															+          retTypeId, imageTypeId, image, sampler, isNonUniform, coordinate,
														
 
															           theBuilder.getConstantInt32(component), compareVal, /*constOffset*/ 0,
														
 
															           varOffset, /*constOffsets*/ 0, /*sampleNumber*/ 0, status);
														
 
															       texels[i] = theBuilder.createCompositeExtract(elemType, gatherRet, {i});
														
@@ -2985,7 +3058,7 @@ uint32_t SPIRVEmitter::processTextureGatherRGBACmpRGBA(
 
															   }
														
 
															   return theBuilder.createImageGather(
														
 
															-      retTypeId, imageTypeId, image, sampler, coordinate,
														
 
															+      retTypeId, imageTypeId, image, sampler, isNonUniform, coordinate,
														
 
															       theBuilder.getConstantInt32(component), compareVal, constOffset,
														
 
															       varOffset, constOffsets, /*sampleNumber*/ 0, status);
														
 
															 }
														
@@ -3019,8 +3092,8 @@ uint32_t SPIRVEmitter::processTextureGatherCmp(const CXXMemberCallExpr *expr) {
 
															   const bool hasOffsetArg = (numArgs == 5) || (numArgs == 4 && !hasStatusArg);
														
 
															   const auto *imageExpr = expr->getImplicitObjectArgument();
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   const uint32_t comparator = doExpr(expr->getArg(2));
														
 
															   uint32_t constOffset = 0, varOffset = 0;
														
@@ -3029,11 +3102,14 @@ uint32_t SPIRVEmitter::processTextureGatherCmp(const CXXMemberCallExpr *expr) {
 
															   const auto retType = typeTranslator.translateType(callee->getReturnType());
														
 
															   const auto imageType = typeTranslator.translateType(imageExpr->getType());
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   return theBuilder.createImageGather(
														
 
															-      retType, imageType, image, sampler, coordinate, /*component*/ 0,
														
 
															-      comparator, constOffset, varOffset, /*constOffsets*/ 0,
														
 
															+      retType, imageType, image, sampler,
														
 
															+      image.isNonUniform() || sampler.isNonUniform(), coordinate,
														
 
															+      /*component*/ 0, comparator, constOffset, varOffset, /*constOffsets*/ 0,
														
 
															       /*sampleNumber*/ 0, status);
														
 
															 }
														
@@ -3051,7 +3127,12 @@ SpirvEvalInfo SPIRVEmitter::processBufferTextureLoad(
 
															   const bool doFetch =
														
 
															       TypeTranslator::isBuffer(type) || TypeTranslator::isTexture(type);
														
 
															-  const uint32_t objectId = loadIfGLValue(object);
														
 
															+  const auto objectInfo = loadIfGLValue(object);
														
 
															+
														
 
															+  if (objectInfo.isNonUniform()) {
														
 
															+    // Decoreate the image handle for OpImageFetch/OpImageRead
														
 
															+    theBuilder.decorate(objectInfo, spv::Decoration::NonUniformEXT);
														
 
															+  }
														
 
															   // For Texture2DMS and Texture2DMSArray, Sample must be used rather than Lod.
														
 
															   uint32_t sampleNumber = 0;
														
@@ -3080,7 +3161,7 @@ SpirvEvalInfo SPIRVEmitter::processBufferTextureLoad(
 
															   // OpImageFetch and OpImageRead can only fetch a vector of 4 elements.
														
 
															   const uint32_t texelTypeId = theBuilder.getVecType(elemTypeId, 4u);
														
 
															   const uint32_t texel = theBuilder.createImageFetchOrRead(
														
 
															-      doFetch, texelTypeId, type, objectId, locationId, lod, constOffset,
														
 
															+      doFetch, texelTypeId, type, objectInfo, locationId, lod, constOffset,
														
 
															       varOffset, /*constOffsets*/ 0, sampleNumber, residencyCode);
														
 
															   // If the result type is a vec1, vec2, or vec3, some extra processing
														
@@ -3795,8 +3876,8 @@ SPIRVEmitter::processIntrinsicMemberCall(const CXXMemberCallExpr *expr,
 
															 uint32_t SPIRVEmitter::createImageSample(
														
 
															     QualType retType, uint32_t imageType, uint32_t image, uint32_t sampler,
														
 
															-    uint32_t coordinate, uint32_t compareVal, uint32_t bias, uint32_t lod,
														
 
															-    std::pair<uint32_t, uint32_t> grad, uint32_t constOffset,
														
 
															+    bool isNonUniform, uint32_t coordinate, uint32_t compareVal, uint32_t bias,
														
 
															+    uint32_t lod, std::pair<uint32_t, uint32_t> grad, uint32_t constOffset,
														
 
															     uint32_t varOffset, uint32_t constOffsets, uint32_t sample, uint32_t minLod,
														
 
															     uint32_t residencyCodeId) {
														
@@ -3805,10 +3886,10 @@ uint32_t SPIRVEmitter::createImageSample(
 
															   // SampleDref* instructions in SPIR-V always return a scalar.
														
 
															   // They also have the correct type in HLSL.
														
 
															   if (compareVal) {
														
 
															-    return theBuilder.createImageSample(retTypeId, imageType, image, sampler,
														
 
															-                                        coordinate, compareVal, bias, lod, grad,
														
 
															-                                        constOffset, varOffset, constOffsets,
														
 
															-                                        sample, minLod, residencyCodeId);
														
 
															+    return theBuilder.createImageSample(
														
 
															+        retTypeId, imageType, image, sampler, isNonUniform, coordinate,
														
 
															+        compareVal, bias, lod, grad, constOffset, varOffset, constOffsets,
														
 
															+        sample, minLod, residencyCodeId);
														
 
															   }
														
 
															   // Non-Dref Sample instructions in SPIR-V must always return a vec4.
														
@@ -3835,9 +3916,9 @@ uint32_t SPIRVEmitter::createImageSample(
 
															     needsLegalization = true;
														
 
															   uint32_t retVal = theBuilder.createImageSample(
														
 
															-      texelTypeId, imageType, image, sampler, coordinate, compareVal, bias, lod,
														
 
															-      grad, constOffset, varOffset, constOffsets, sample, minLod,
														
 
															-      residencyCodeId);
														
 
															+      texelTypeId, imageType, image, sampler, isNonUniform, coordinate,
														
 
															+      compareVal, bias, lod, grad, constOffset, varOffset, constOffsets, sample,
														
 
															+      minLod, residencyCodeId);
														
 
															   // Extract smaller vector from the vec4 result if necessary.
														
 
															   if (texelTypeId != retTypeId) {
														
@@ -3886,7 +3967,9 @@ uint32_t SPIRVEmitter::processTextureSampleGather(const CXXMemberCallExpr *expr,
 
															   else if (numArgs > 3 && expr->getArg(3)->getType()->isFloatingType())
														
 
															     clamp = doExpr(expr->getArg(3));
														
 
															   const bool hasClampArg = (clamp != 0);
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   // Subtract 1 for status (if it exists), subtract 1 for clamp (if it exists),
														
 
															   // and subtract 2 for sampler_state and location.
														
@@ -3894,24 +3977,26 @@ uint32_t SPIRVEmitter::processTextureSampleGather(const CXXMemberCallExpr *expr,
 
															   const auto *imageExpr = expr->getImplicitObjectArgument();
														
 
															   const uint32_t imageType = typeTranslator.translateType(imageExpr->getType());
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   // .Sample()/.Gather() may have a third optional paramter for offset.
														
 
															   uint32_t constOffset = 0, varOffset = 0;
														
 
															   if (hasOffsetArg)
														
 
															     handleOffsetInMethodCall(expr, 2, &constOffset, &varOffset);
														
 
															+  const bool isNonUniform = image.isNonUniform() || sampler.isNonUniform();
														
 
															   const auto retType = expr->getDirectCallee()->getReturnType();
														
 
															   const auto retTypeId = typeTranslator.translateType(retType);
														
 
															   if (isSample) {
														
 
															     return createImageSample(
														
 
															-        retType, imageType, image, sampler, coordinate, /*compareVal*/ 0,
														
 
															-        /*bias*/ 0, /*lod*/ 0, std::make_pair(0, 0), constOffset, varOffset,
														
 
															-        /*constOffsets*/ 0, /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															+        retType, imageType, image, sampler, isNonUniform, coordinate,
														
 
															+        /*compareVal*/ 0, /*bias*/ 0, /*lod*/ 0, std::make_pair(0, 0),
														
 
															+        constOffset, varOffset, /*constOffsets*/ 0, /*sampleNumber*/ 0,
														
 
															+        /*minLod*/ clamp, status);
														
 
															   } else {
														
 
															     return theBuilder.createImageGather(
														
 
															-        retTypeId, imageType, image, sampler, coordinate,
														
 
															+        retTypeId, imageType, image, sampler, isNonUniform, coordinate,
														
 
															         // .Gather() doc says we return four components of red data.
														
 
															         theBuilder.getConstantInt32(0), /*compareVal*/ 0, constOffset,
														
 
															         varOffset, /*constOffsets*/ 0, /*sampleNumber*/ 0, status);
														
@@ -3953,7 +4038,9 @@ SPIRVEmitter::processTextureSampleBiasLevel(const CXXMemberCallExpr *expr,
 
															   const auto numArgs = expr->getNumArgs();
														
 
															   const bool hasStatusArg =
														
 
															       expr->getArg(numArgs - 1)->getType()->isUnsignedIntegerType();
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   uint32_t clamp = 0;
														
 
															   // The .SampleLevel() methods do not take the clamp argument.
														
@@ -3971,8 +4058,8 @@ SPIRVEmitter::processTextureSampleBiasLevel(const CXXMemberCallExpr *expr,
 
															   const auto *imageExpr = expr->getImplicitObjectArgument();
														
 
															   const uint32_t imageType = typeTranslator.translateType(imageExpr->getType());
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   uint32_t lod = 0;
														
 
															   uint32_t bias = 0;
														
@@ -3988,10 +4075,11 @@ SPIRVEmitter::processTextureSampleBiasLevel(const CXXMemberCallExpr *expr,
 
															   const auto retType = expr->getDirectCallee()->getReturnType();
														
 
															-  return createImageSample(retType, imageType, image, sampler, coordinate,
														
 
															-                           /*compareVal*/ 0, bias, lod, std::make_pair(0, 0),
														
 
															-                           constOffset, varOffset, /*constOffsets*/ 0,
														
 
															-                           /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															+  return createImageSample(
														
 
															+      retType, imageType, image, sampler,
														
 
															+      image.isNonUniform() || sampler.isNonUniform(), coordinate,
														
 
															+      /*compareVal*/ 0, bias, lod, std::make_pair(0, 0), constOffset, varOffset,
														
 
															+      /*constOffsets*/ 0, /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															 }
														
 
															 uint32_t SPIRVEmitter::processTextureSampleGrad(const CXXMemberCallExpr *expr) {
														
@@ -4016,7 +4104,9 @@ uint32_t SPIRVEmitter::processTextureSampleGrad(const CXXMemberCallExpr *expr) {
 
															   const auto numArgs = expr->getNumArgs();
														
 
															   const bool hasStatusArg =
														
 
															       expr->getArg(numArgs - 1)->getType()->isUnsignedIntegerType();
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   uint32_t clamp = 0;
														
 
															   if (numArgs > 4 && expr->getArg(4)->getType()->isFloatingType())
														
@@ -4031,8 +4121,8 @@ uint32_t SPIRVEmitter::processTextureSampleGrad(const CXXMemberCallExpr *expr) {
 
															   const auto *imageExpr = expr->getImplicitObjectArgument();
														
 
															   const uint32_t imageType = typeTranslator.translateType(imageExpr->getType());
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   const uint32_t ddx = doExpr(expr->getArg(2));
														
 
															   const uint32_t ddy = doExpr(expr->getArg(3));
														
@@ -4043,9 +4133,11 @@ uint32_t SPIRVEmitter::processTextureSampleGrad(const CXXMemberCallExpr *expr) {
 
															   const auto retType = expr->getDirectCallee()->getReturnType();
														
 
															   return createImageSample(
														
 
															-      retType, imageType, image, sampler, coordinate, /*compareVal*/ 0,
														
 
															-      /*bias*/ 0, /*lod*/ 0, std::make_pair(ddx, ddy), constOffset, varOffset,
														
 
															-      /*constOffsets*/ 0, /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															+      retType, imageType, image, sampler,
														
 
															+      image.isNonUniform() || sampler.isNonUniform(), coordinate,
														
 
															+      /*compareVal*/ 0, /*bias*/ 0, /*lod*/ 0, std::make_pair(ddx, ddy),
														
 
															+      constOffset, varOffset, /*constOffsets*/ 0, /*sampleNumber*/ 0,
														
 
															+      /*minLod*/ clamp, status);
														
 
															 }
														
 
															 uint32_t
														
@@ -4098,7 +4190,9 @@ SPIRVEmitter::processTextureSampleCmpCmpLevelZero(const CXXMemberCallExpr *expr,
 
															   const auto numArgs = expr->getNumArgs();
														
 
															   const bool hasStatusArg =
														
 
															       expr->getArg(numArgs - 1)->getType()->isUnsignedIntegerType();
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   uint32_t clamp = 0;
														
 
															   // The .SampleCmpLevelZero() methods do not take the clamp argument.
														
@@ -4115,8 +4209,8 @@ SPIRVEmitter::processTextureSampleCmpCmpLevelZero(const CXXMemberCallExpr *expr,
 
															   const bool hasOffsetArg = numArgs - hasClampArg - hasStatusArg - 3 > 0;
														
 
															   const auto *imageExpr = expr->getImplicitObjectArgument();
														
 
															-  const uint32_t image = loadIfGLValue(imageExpr);
														
 
															-  const uint32_t sampler = doExpr(expr->getArg(0));
														
 
															+  const auto image = loadIfGLValue(imageExpr);
														
 
															+  const auto sampler = doExpr(expr->getArg(0));
														
 
															   const uint32_t coordinate = doExpr(expr->getArg(1));
														
 
															   const uint32_t compareVal = doExpr(expr->getArg(2));
														
 
															   // If offset is present in .SampleCmp(), it will be the fourth argument.
														
@@ -4126,21 +4220,13 @@ SPIRVEmitter::processTextureSampleCmpCmpLevelZero(const CXXMemberCallExpr *expr,
 
															   const uint32_t lod = isCmp ? 0 : theBuilder.getConstantFloat32(0);
														
 
															   const auto retType = expr->getDirectCallee()->getReturnType();
														
 
															-  // TODO: Hack. Drivers are expecting the Depth value in OpTypeImage to match
														
 
															-  // the OpImageSample* instruction: Depth=0 for normal sampling, and Depth=1
														
 
															-  // for depth-comparison sampling. That behavior is not what the spec says;
														
 
															-  // Vulkan spec reads "The 'Depth' operand of OpTypeImage is ignored."
														
 
															-  // We always generate OpTypeImage variables with Depth=0. Hack this only
														
 
															-  // depth-comparison sampling code path to use Depth=1 for the OpTypeImage
														
 
															-  // used by OpSampledImage. This causes inconsistent types in SPIR-V, but
														
 
															-  // pleases drivers. Whatever.
														
 
															-  const auto imageType = typeTranslator.translateResourceType(
														
 
															-      imageExpr->getType(), LayoutRule::Void, /*isDepthCmp=*/true);
														
 
															-
														
 
															-  return createImageSample(retType, imageType, image, sampler, coordinate,
														
 
															-                           compareVal, /*bias*/ 0, lod, std::make_pair(0, 0),
														
 
															-                           constOffset, varOffset, /*constOffsets*/ 0,
														
 
															-                           /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															+  const auto imageType = typeTranslator.translateType(imageExpr->getType());
														
 
															+
														
 
															+  return createImageSample(
														
 
															+      retType, imageType, image, sampler,
														
 
															+      image.isNonUniform() || sampler.isNonUniform(), coordinate, compareVal,
														
 
															+      /*bias*/ 0, lod, std::make_pair(0, 0), constOffset, varOffset,
														
 
															+      /*constOffsets*/ 0, /*sampleNumber*/ 0, /*minLod*/ clamp, status);
														
 
															 }
														
 
															 SpirvEvalInfo
														
@@ -4192,7 +4278,9 @@ SPIRVEmitter::processBufferTextureLoad(const CXXMemberCallExpr *expr) {
 
															   const bool isTextureMS = TypeTranslator::isTextureMS(objectType);
														
 
															   const bool hasStatusArg =
														
 
															       expr->getArg(numArgs - 1)->getType()->isUnsignedIntegerType();
														
 
															-  const auto status = hasStatusArg ? doExpr(expr->getArg(numArgs - 1)) : 0;
														
 
															+  const auto status =
														
 
															+      hasStatusArg ? static_cast<uint32_t>(doExpr(expr->getArg(numArgs - 1)))
														
 
															+                   : 0;
														
 
															   if (TypeTranslator::isBuffer(objectType) ||
														
 
															       TypeTranslator::isRWBuffer(objectType) ||
														
@@ -4552,19 +4640,21 @@ SpirvEvalInfo SPIRVEmitter::doUnaryOperator(const UnaryOperator *expr) {
 
															     // Prefix increment/decrement operator returns a lvalue, while postfix
														
 
															     // increment/decrement returns a rvalue.
														
 
															-    return isPre ? subValue : SpirvEvalInfo(originValue).setRValue();
														
 
															+    return isPre ? subValue : subValue.setResultId(originValue).setRValue();
														
 
															   }
														
 
															   case UO_Not: {
														
 
															-    const auto valId =
														
 
															-        theBuilder.createUnaryOp(spv::Op::OpNot, subTypeId, subValue);
														
 
															-    return SpirvEvalInfo(valId).setRValue();
														
 
															+    return subValue
														
 
															+        .setResultId(
														
 
															+            theBuilder.createUnaryOp(spv::Op::OpNot, subTypeId, subValue))
														
 
															+        .setRValue();
														
 
															   }
														
 
															   case UO_LNot: {
														
 
															     // Parsing will do the necessary casting to make sure we are applying the
														
 
															     // ! operator on boolean values.
														
 
															-    const auto valId =
														
 
															-        theBuilder.createUnaryOp(spv::Op::OpLogicalNot, subTypeId, subValue);
														
 
															-    return SpirvEvalInfo(valId).setRValue();
														
 
															+    return subValue
														
 
															+        .setResultId(theBuilder.createUnaryOp(spv::Op::OpLogicalNot, subTypeId,
														
 
															+                                              subValue))
														
 
															+        .setRValue();
														
 
															   }
														
 
															   case UO_Plus:
														
 
															     // No need to do anything for the prefix + operator.
														
@@ -4573,8 +4663,9 @@ SpirvEvalInfo SPIRVEmitter::doUnaryOperator(const UnaryOperator *expr) {
 
															     // SPIR-V have two opcodes for negating values: OpSNegate and OpFNegate.
														
 
															     const spv::Op spvOp = isFloatOrVecOfFloatType(subType) ? spv::Op::OpFNegate
														
 
															                                                            : spv::Op::OpSNegate;
														
 
															-    const auto valId = theBuilder.createUnaryOp(spvOp, subTypeId, subValue);
														
 
															-    return SpirvEvalInfo(valId).setRValue();
														
 
															+    return subValue
														
 
															+        .setResultId(theBuilder.createUnaryOp(spvOp, subTypeId, subValue))
														
 
															+        .setRValue();
														
 
															   }
														
 
															   default:
														
 
															     break;
														
@@ -4708,6 +4799,8 @@ SpirvEvalInfo SPIRVEmitter::processAssignment(const Expr *lhs,
 
															                                               const SpirvEvalInfo &rhs,
														
 
															                                               const bool isCompoundAssignment,
														
 
															                                               SpirvEvalInfo lhsPtr) {
														
 
															+  lhs = lhs->IgnoreParenNoopCasts(astContext);
														
 
															+
														
 
															   // Assigning to vector swizzling should be handled differently.
														
 
															   if (SpirvEvalInfo result = tryToAssignToVectorElements(lhs, rhs))
														
 
															     return result;
														
@@ -4734,7 +4827,9 @@ SpirvEvalInfo SPIRVEmitter::processAssignment(const Expr *lhs,
 
															 void SPIRVEmitter::storeValue(const SpirvEvalInfo &lhsPtr,
														
 
															                               const SpirvEvalInfo &rhsVal,
														
 
															-                              const QualType lhsValType) {
														
 
															+                              QualType lhsValType) {
														
 
															+  if (const auto *refType = lhsValType->getAs<ReferenceType>())
														
 
															+    lhsValType = refType->getPointeeType();
														
 
															   QualType matElemType = {};
														
 
															   const bool lhsIsMat = typeTranslator.isMxNMatrix(lhsValType, &matElemType);
														
@@ -5082,8 +5177,14 @@ SpirvEvalInfo SPIRVEmitter::processBinaryOp(const Expr *lhs, const Expr *rhs,
 
															     }
														
 
															     auto result = SpirvEvalInfo(valId).setRValue();
														
 
															+
														
 
															+    // Propagate RelaxedPrecision
														
 
															     if (lhsVal.isRelaxedPrecision() || rhsVal.isRelaxedPrecision())
														
 
															       result.setRelaxedPrecision();
														
 
															+    // Propagate NonUniformEXT
														
 
															+    if (lhsVal.isNonUniform() || rhsVal.isNonUniform())
														
 
															+      result.setNonUniform();
														
 
															+
														
 
															     return result;
														
 
															   }
														
 
															   case BO_Assign:
														
@@ -5556,8 +5657,9 @@ SPIRVEmitter::tryToAssignToVectorElements(const Expr *lhs,
 
															   }
														
 
															   const auto vec1 = doExpr(base);
														
 
															-  const uint32_t vec1Val =
														
 
															-      vec1.isRValue() ? vec1 : theBuilder.createLoad(baseTypeId, vec1);
														
 
															+  const uint32_t vec1Val = vec1.isRValue()
														
 
															+                               ? static_cast<uint32_t>(vec1)
														
 
															+                               : theBuilder.createLoad(baseTypeId, vec1);
														
 
															   const uint32_t shuffle =
														
 
															       theBuilder.createVectorShuffle(baseTypeId, vec1Val, rhs, selectors);
														
@@ -5579,9 +5681,14 @@ SPIRVEmitter::tryToAssignToRWBufferRWTexture(const Expr *lhs,
 
															   if (isBufferTextureIndexing(lhsExpr, &baseExpr, &indexExpr)) {
														
 
															     const uint32_t locId = doExpr(indexExpr);
														
 
															     const QualType imageType = baseExpr->getType();
														
 
															+    const auto baseInfo = doExpr(baseExpr);
														
 
															     const uint32_t imageId = theBuilder.createLoad(
														
 
															-        typeTranslator.translateType(imageType), doExpr(baseExpr));
														
 
															+        typeTranslator.translateType(imageType), baseInfo);
														
 
															     theBuilder.createImageWrite(imageType, imageId, locId, rhs);
														
 
															+    if (baseInfo.isNonUniform()) {
														
 
															+      // Decorate the image handle for OpImageWrite
														
 
															+      theBuilder.decorate(imageId, spv::Decoration::NonUniformEXT);
														
 
															+    }
														
 
															     return rhs;
														
 
															   }
														
 
															   return 0;
														
@@ -6192,6 +6299,9 @@ SpirvEvalInfo SPIRVEmitter::processIntrinsicCallExpr(const CallExpr *callExpr) {
 
															   case hlsl::IntrinsicOp::IOP_InterlockedCompareExchange:
														
 
															     retVal = processIntrinsicInterlockedMethod(callExpr, hlslOpcode);
														
 
															     break;
														
 
															+  case hlsl::IntrinsicOp::IOP_NonUniformResourceIndex:
														
 
															+    retVal = processIntrinsicNonUniformResourceIndex(callExpr);
														
 
															+    break;
														
 
															   case hlsl::IntrinsicOp::IOP_tex1D:
														
 
															   case hlsl::IntrinsicOp::IOP_tex1Dbias:
														
 
															   case hlsl::IntrinsicOp::IOP_tex1Dgrad:
														
@@ -6578,6 +6688,11 @@ SPIRVEmitter::processIntrinsicInterlockedMethod(const CallExpr *expr,
 
															       }
														
 
															       const auto coordId = doExpr(index);
														
 
															       ptr = theBuilder.createImageTexelPointer(ptrType, baseId, coordId, zero);
														
 
															+      if (baseId.isNonUniform()) {
														
 
															+        // Image texel pointer will used to access image memory. Vulkan requires
														
 
															+        // it to be decorated with NonUniformEXT.
														
 
															+        theBuilder.decorate(ptr, spv::Decoration::NonUniformEXT);
														
 
															+      }
														
 
															     }
														
 
															   }
														
 
															   if (!ptr)
														
@@ -6621,6 +6736,28 @@ SPIRVEmitter::processIntrinsicInterlockedMethod(const CallExpr *expr,
 
															   return 0;
														
 
															 }
														
 
															+SpirvEvalInfo
														
 
															+SPIRVEmitter::processIntrinsicNonUniformResourceIndex(const CallExpr *expr) {
														
 
															+  foundNonUniformResourceIndex = true;
														
 
															+  theBuilder.addExtension(Extension::EXT_descriptor_indexing,
														
 
															+                          "NonUniformResourceIndex", expr->getExprLoc());
														
 
															+  theBuilder.requireCapability(spv::Capability::ShaderNonUniformEXT);
														
 
															+
														
 
															+  auto index = doExpr(expr->getArg(0)).setNonUniform();
														
 
															+  // Decorate the expression in NonUniformResourceIndex() with NonUniformEXT.
														
 
															+  // Aside from this, we also need to eventually populate the NonUniformEXT
														
 
															+  // status to the usage of this expression: the "pointer" operand to a memory
														
 
															+  // access instruction. Vulkan spec has the following rules:
														
 
															+  //
														
 
															+  // If an instruction loads from or stores to a resource (including atomics and
														
 
															+  // image instructions) and the resource descriptor being accessed is not
														
 
															+  // dynamically uniform, then the operand corresponding to that resource (e.g.
														
 
															+  // the pointer or sampled image operand) must be decorated with NonUniformEXT.
														
 
															+  theBuilder.decorate(index, spv::Decoration::NonUniformEXT);
														
 
															+
														
 
															+  return index;
														
 
															+}
														
 
															+
														
 
															 uint32_t SPIRVEmitter::processIntrinsicMsad4(const CallExpr *callExpr) {
														
 
															   emitWarning("msad4 intrinsic function is emulated using many SPIR-V "
														
 
															               "instructions due to lack of direct SPIR-V equivalent",
														
@@ -9143,8 +9280,8 @@ bool SPIRVEmitter::emitEntryFunctionWrapper(const FunctionDecl *decl,
 
															   declIdMapper.glPerVertex.calculateClipCullDistanceArraySize();
														
 
															   if (!shaderModel.IsCS()) {
														
 
															-    // Generate the gl_PerVertex structs or stand-alone builtins of
														
 
															-    // Position, ClipDistance, and CullDistance.
														
 
															+    // Generate stand-alone builtins of Position, ClipDistance, and
														
 
															+    // CullDistance, which belongs to gl_PerVertex.
														
 
															     declIdMapper.glPerVertex.generateVars(inputArraySize, outputArraySize);
														
 
															   }
														
@@ -9323,11 +9460,12 @@ bool SPIRVEmitter::processHSEntryPointOutputAndPCF(
 
															   // Now create a barrier before calling the Patch Constant Function (PCF).
														
 
															   // Flags are:
														
 
															   // Execution Barrier scope = Workgroup (2)
														
 
															-  // Memory Barrier scope = Device (1)
														
 
															+  // Memory Barrier scope = Invocation (4)
														
 
															   // Memory Semantics Barrier scope = None (0)
														
 
															-  theBuilder.createBarrier(theBuilder.getConstantUint32(2),
														
 
															-                           theBuilder.getConstantUint32(1),
														
 
															-                           theBuilder.getConstantUint32(0));
														
 
															+  const auto constZero = theBuilder.getConstantUint32(0);
														
 
															+  const auto constFour = theBuilder.getConstantUint32(4);
														
 
															+  const auto constTwo = theBuilder.getConstantUint32(2);
														
 
															+  theBuilder.createBarrier(constTwo, constFour, constZero);
														
 
															   // The PCF should be called only once. Therefore, we check the invocationID,
														
 
															   // and we only allow ID 0 to call the PCF.
														
--- a/tools/clang/lib/SPIRV/SPIRVEmitter.h
+++ b/tools/clang/lib/SPIRV/SPIRVEmitter.h
@@ -100,7 +100,6 @@ private:
 
															   SpirvEvalInfo doConditionalOperator(const ConditionalOperator *expr);
														
 
															   SpirvEvalInfo doCXXMemberCallExpr(const CXXMemberCallExpr *expr);
														
 
															   SpirvEvalInfo doCXXOperatorCallExpr(const CXXOperatorCallExpr *expr);
														
 
															-  SpirvEvalInfo doDeclRefExpr(const DeclRefExpr *expr);
														
 
															   SpirvEvalInfo doExtMatrixElementExpr(const ExtMatrixElementExpr *expr);
														
 
															   SpirvEvalInfo doHLSLVectorElementExpr(const HLSLVectorElementExpr *expr);
														
 
															   SpirvEvalInfo doInitListExpr(const InitListExpr *expr);
														
@@ -273,9 +272,8 @@ private:
 
															   /// Creates a temporary local variable in the current function of the given
														
 
															   /// varType and varName. Initializes the variable with the given initValue.
														
 
															   /// Returns the <result-id> of the variable.
														
 
															-  uint32_t SPIRVEmitter::createTemporaryVar(QualType varType,
														
 
															-                                            llvm::StringRef varName,
														
 
															-                                            const SpirvEvalInfo &initValue);
														
 
															+  uint32_t createTemporaryVar(QualType varType, llvm::StringRef varName,
														
 
															+                              const SpirvEvalInfo &initValue);
														
 
															   /// Collects all indices (SPIR-V constant values) from consecutive MemberExprs
														
 
															   /// or ArraySubscriptExprs or operator[] calls and writes into indices.
														
@@ -472,6 +470,9 @@ private:
 
															   /// Processes SM6.0 quad-wide shuffle.
														
 
															   uint32_t processWaveQuadWideShuffle(const CallExpr *, hlsl::IntrinsicOp op);
														
 
															+  /// Processes the NonUniformResourceIndex intrinsic function.
														
 
															+  SpirvEvalInfo processIntrinsicNonUniformResourceIndex(const CallExpr *);
														
 
															+
														
 
															 private:
														
 
															   /// Returns the <result-id> for constant value 0 of the given type.
														
 
															   uint32_t getValueZero(QualType type);
														
@@ -854,8 +855,8 @@ private:
 
															   /// return a vec4. As a result, an extra processing step is necessary.
														
 
															   uint32_t createImageSample(QualType retType, uint32_t imageType,
														
 
															                              uint32_t image, uint32_t sampler,
														
 
															-                             uint32_t coordinate, uint32_t compareVal,
														
 
															-                             uint32_t bias, uint32_t lod,
														
 
															+                             bool isNonUniform, uint32_t coordinate,
														
 
															+                             uint32_t compareVal, uint32_t bias, uint32_t lod,
														
 
															                              std::pair<uint32_t, uint32_t> grad,
														
 
															                              uint32_t constOffset, uint32_t varOffset,
														
 
															                              uint32_t constOffsets, uint32_t sample,
														
@@ -939,6 +940,13 @@ private:
 
															   /// all 32-bit scalar constants will be translated into OpSpecConstant.
														
 
															   bool isSpecConstantMode;
														
 
															+  /// Indicates that we have found a NonUniformResourceIndex call when
														
 
															+  /// traversing.
														
 
															+  /// This field is used to convery information in a bottom-up manner; if we
														
 
															+  /// have something like `aResource[NonUniformResourceIndex(aIndex)]`, we need
														
 
															+  /// to attach `aResource` with proper decorations.
														
 
															+  bool foundNonUniformResourceIndex;
														
 
															+
														
 
															   /// Whether the translated SPIR-V binary needs legalization.
														
 
															   ///
														
 
															   /// The following cases will require legalization:
														
--- a/tools/clang/lib/SPIRV/SpirvEvalInfo.h
+++ b/tools/clang/lib/SPIRV/SpirvEvalInfo.h
@@ -93,6 +93,9 @@ public:
 
															   inline SpirvEvalInfo &setRelaxedPrecision();
														
 
															   bool isRelaxedPrecision() const { return isRelaxedPrecision_; }
														
 
															+  inline SpirvEvalInfo &setNonUniform(bool nu = true);
														
 
															+  bool isNonUniform() const { return isNonUniform_; }
														
 
															+
														
 
															 private:
														
 
															   uint32_t resultId;
														
 
															   /// Indicates whether this evaluation result contains alias variables
														
@@ -112,13 +115,14 @@ private:
 
															   bool isConstant_;
														
 
															   bool isSpecConstant_;
														
 
															   bool isRelaxedPrecision_;
														
 
															+  bool isNonUniform_;
														
 
															 };
														
 
															 SpirvEvalInfo::SpirvEvalInfo(uint32_t id)
														
 
															     : resultId(id), containsAlias(false),
														
 
															       storageClass(spv::StorageClass::Function), layoutRule(LayoutRule::Void),
														
 
															       isRValue_(false), isConstant_(false), isSpecConstant_(false),
														
 
															-      isRelaxedPrecision_(false) {}
														
 
															+      isRelaxedPrecision_(false), isNonUniform_(false) {}
														
 
															 SpirvEvalInfo &SpirvEvalInfo::setResultId(uint32_t id) {
														
 
															   resultId = id;
														
@@ -167,6 +171,11 @@ SpirvEvalInfo &SpirvEvalInfo::setRelaxedPrecision() {
 
															   return *this;
														
 
															 }
														
 
															+SpirvEvalInfo &SpirvEvalInfo::setNonUniform(bool nu) {
														
 
															+  isNonUniform_ = nu;
														
 
															+  return *this;
														
 
															+}
														
 
															+
														
 
															 } // end namespace spirv
														
 
															 } // end namespace clang
														
--- a/tools/clang/lib/SPIRV/TypeTranslator.cpp
+++ b/tools/clang/lib/SPIRV/TypeTranslator.cpp
@@ -621,22 +621,37 @@ uint32_t TypeTranslator::translateType(QualType type, LayoutRule rule) {
 
															                                     decorations);
														
 
															   }
														
 
															-  if (const auto *arrayType = astContext.getAsConstantArrayType(type)) {
														
 
															-    const uint32_t elemType = translateType(arrayType->getElementType(), rule);
														
 
															-    // TODO: handle extra large array size?
														
 
															-    const auto size =
														
 
															-        static_cast<uint32_t>(arrayType->getSize().getZExtValue());
														
 
															+  // Array type
														
 
															+  if (const auto *arrayType = astContext.getAsArrayType(type)) {
														
 
															+    const auto elemType = arrayType->getElementType();
														
 
															+    const uint32_t elemTypeId = translateType(elemType, rule);
														
 
															     llvm::SmallVector<const Decoration *, 4> decorations;
														
 
															-    if (rule != LayoutRule::Void) {
														
 
															+    if (rule != LayoutRule::Void &&
														
 
															+        // We won't have stride information for structured/byte buffers since
														
 
															+        // they contain runtime arrays.
														
 
															+        !isAKindOfStructuredOrByteBuffer(elemType)) {
														
 
															       uint32_t stride = 0;
														
 
															       (void)getAlignmentAndSize(type, rule, &stride);
														
 
															       decorations.push_back(
														
 
															           Decoration::getArrayStride(*theBuilder.getSPIRVContext(), stride));
														
 
															     }
														
 
															-    return theBuilder.getArrayType(elemType, theBuilder.getConstantUint32(size),
														
 
															-                                   decorations);
														
 
															+    if (const auto *caType = astContext.getAsConstantArrayType(type)) {
														
 
															+      const auto size = static_cast<uint32_t>(caType->getSize().getZExtValue());
														
 
															+      return theBuilder.getArrayType(
														
 
															+          elemTypeId, theBuilder.getConstantUint32(size), decorations);
														
 
															+    } else {
														
 
															+      assert(type->isIncompleteArrayType());
														
 
															+      // Runtime arrays of resources needs additional capability.
														
 
															+      if (hlsl::IsHLSLResourceType(arrayType->getElementType())) {
														
 
															+        theBuilder.addExtension(Extension::EXT_descriptor_indexing,
														
 
															+                                "runtime array of resources", {});
														
 
															+        theBuilder.requireCapability(
														
 
															+            spv::Capability::RuntimeDescriptorArrayEXT);
														
 
															+      }
														
 
															+      return theBuilder.getRuntimeArrayType(elemTypeId, decorations);
														
 
															+    }
														
 
															   }
														
 
															   emitError("type %0 unimplemented") << type->getTypeClassName();
														
@@ -656,39 +671,6 @@ uint32_t TypeTranslator::getACSBufferCounter() {
 
															                                   decorations);
														
 
															 }
														
 
															-uint32_t TypeTranslator::getGlPerVertexStruct(
														
 
															-    uint32_t clipArraySize, uint32_t cullArraySize, llvm::StringRef name,
														
 
															-    const llvm::SmallVector<std::string, 4> &fieldSemantics) {
														
 
															-  const uint32_t f32Type = theBuilder.getFloat32Type();
														
 
															-  const uint32_t v4f32Type = theBuilder.getVecType(f32Type, 4);
														
 
															-  const uint32_t clipType = theBuilder.getArrayType(
														
 
															-      f32Type, theBuilder.getConstantUint32(clipArraySize));
														
 
															-  const uint32_t cullType = theBuilder.getArrayType(
														
 
															-      f32Type, theBuilder.getConstantUint32(cullArraySize));
														
 
															-
														
 
															-  auto &ctx = *theBuilder.getSPIRVContext();
														
 
															-  llvm::SmallVector<const Decoration *, 1> decorations;
														
 
															-
														
 
															-  decorations.push_back(Decoration::getBuiltIn(ctx, spv::BuiltIn::Position, 0));
														
 
															-  decorations.push_back(
														
 
															-      Decoration::getBuiltIn(ctx, spv::BuiltIn::PointSize, 1));
														
 
															-  decorations.push_back(
														
 
															-      Decoration::getBuiltIn(ctx, spv::BuiltIn::ClipDistance, 2));
														
 
															-  decorations.push_back(
														
 
															-      Decoration::getBuiltIn(ctx, spv::BuiltIn::CullDistance, 3));
														
 
															-  decorations.push_back(Decoration::getBlock(ctx));
														
 
															-
														
 
															-  if (spirvOptions.enableReflect) {
														
 
															-    for (uint32_t i = 0; i < 4; ++i)
														
 
															-      if (!fieldSemantics[i].empty())
														
 
															-        decorations.push_back(
														
 
															-            Decoration::getHlslSemanticGOOGLE(ctx, fieldSemantics[i], i));
														
 
															-  }
														
 
															-
														
 
															-  return theBuilder.getStructType({v4f32Type, f32Type, clipType, cullType},
														
 
															-                                  name, {}, decorations);
														
 
															-}
														
 
															-
														
 
															 bool TypeTranslator::isScalarType(QualType type, QualType *scalarType) {
														
 
															   bool isScalar = false;
														
 
															   QualType ty = {};
														
@@ -749,6 +731,10 @@ bool TypeTranslator::isRWAppendConsumeSBuffer(QualType type) {
 
															 }
														
 
															 bool TypeTranslator::isAKindOfStructuredOrByteBuffer(QualType type) {
														
 
															+  // Strip outer arrayness first
														
 
															+  while (type->isArrayType())
														
 
															+    type = type->getAsArrayTypeUnsafe()->getElementType();
														
 
															+
														
 
															   if (const RecordType *recordType = type->getAs<RecordType>()) {
														
 
															     StringRef name = recordType->getDecl()->getName();
														
 
															     return name == "StructuredBuffer" || name == "RWStructuredBuffer" ||
														
@@ -775,6 +761,79 @@ bool TypeTranslator::isOrContainsAKindOfStructuredOrByteBuffer(QualType type) {
 
															   return false;
														
 
															 }
														
 
															+bool TypeTranslator::isOrContains16BitType(QualType type) {
														
 
															+  // Primitive types
														
 
															+  {
														
 
															+    QualType ty = {};
														
 
															+    if (isScalarType(type, &ty)) {
														
 
															+      if (const auto *builtinType = ty->getAs<BuiltinType>()) {
														
 
															+        switch (builtinType->getKind()) {
														
 
															+        case BuiltinType::Short:
														
 
															+        case BuiltinType::UShort:
														
 
															+        case BuiltinType::Min12Int:
														
 
															+        case BuiltinType::Half:
														
 
															+        case BuiltinType::Min10Float: {
														
 
															+          return spirvOptions.enable16BitTypes;
														
 
															+        }
														
 
															+        default:
														
 
															+          return false;
														
 
															+        }
														
 
															+      }
														
 
															+    }
														
 
															+  }
														
 
															+
														
 
															+  // Vector types
														
 
															+  {
														
 
															+    QualType elemType = {};
														
 
															+    if (isVectorType(type, &elemType))
														
 
															+      return isOrContains16BitType(elemType);
														
 
															+  }
														
 
															+
														
 
															+  // Matrix types
														
 
															+  {
														
 
															+    QualType elemType = {};
														
 
															+    if (isMxNMatrix(type, &elemType)) {
														
 
															+      return isOrContains16BitType(elemType);
														
 
															+    }
														
 
															+  }
														
 
															+
														
 
															+  // Struct type
														
 
															+  if (const auto *structType = type->getAs<RecordType>()) {
														
 
															+    const auto *decl = structType->getDecl();
														
 
															+
														
 
															+    for (const auto *field : decl->fields()) {
														
 
															+      if (isOrContains16BitType(field->getType()))
														
 
															+        return true;
														
 
															+    }
														
 
															+
														
 
															+    return false;
														
 
															+  }
														
 
															+
														
 
															+  // Array type
														
 
															+  if (const auto *arrayType = type->getAsArrayTypeUnsafe()) {
														
 
															+    return isOrContains16BitType(arrayType->getElementType());
														
 
															+  }
														
 
															+
														
 
															+  // Reference types
														
 
															+  if (const auto *refType = type->getAs<ReferenceType>()) {
														
 
															+    return isOrContains16BitType(refType->getPointeeType());
														
 
															+  }
														
 
															+
														
 
															+  // Pointer types
														
 
															+  if (const auto *ptrType = type->getAs<PointerType>()) {
														
 
															+    return isOrContains16BitType(ptrType->getPointeeType());
														
 
															+  }
														
 
															+
														
 
															+  if (const auto *typedefType = type->getAs<TypedefType>()) {
														
 
															+    return isOrContains16BitType(typedefType->desugar());
														
 
															+  }
														
 
															+
														
 
															+  emitError("checking 16-bit type for %0 unimplemented")
														
 
															+      << type->getTypeClassName();
														
 
															+  type->dump();
														
 
															+  return 0;
														
 
															+}
														
 
															+
														
 
															 bool TypeTranslator::isStructuredBuffer(QualType type) {
														
 
															   const auto *recordType = type->getAs<RecordType>();
														
 
															   if (!recordType)
														
@@ -1326,8 +1385,7 @@ TypeTranslator::collectDeclsInDeclContext(const DeclContext *declContext) {
 
															   return decls;
														
 
															 }
														
 
															-uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule,
														
 
															-                                               bool isDepthCmp) {
														
 
															+uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule) {
														
 
															   // Resource types are either represented like C struct or C++ class in the
														
 
															   // AST. Samplers are represented like C struct, so isStructureType() will
														
 
															   // return true for it; textures are represented like C++ class, so
														
@@ -1357,7 +1415,7 @@ uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule,
 
															       const auto isMS = (name == "Texture2DMS" || name == "Texture2DMSArray");
														
 
															       const auto sampledType = hlsl::GetHLSLResourceResultType(type);
														
 
															       return theBuilder.getImageType(translateType(getElementType(sampledType)),
														
 
															-                                     dim, isDepthCmp, isArray, isMS);
														
 
															+                                     dim, /*depth*/ 2, isArray, isMS);
														
 
															     }
														
 
															     // There is no RWTexture3DArray
														
@@ -1369,7 +1427,7 @@ uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule,
 
															       const auto sampledType = hlsl::GetHLSLResourceResultType(type);
														
 
															       const auto format = translateSampledTypeToImageFormat(sampledType);
														
 
															       return theBuilder.getImageType(translateType(getElementType(sampledType)),
														
 
															-                                     dim, /*depth*/ 0, isArray, /*MS*/ 0,
														
 
															+                                     dim, /*depth*/ 2, isArray, /*MS*/ 0,
														
 
															                                      /*Sampled*/ 2u, format);
														
 
															     }
														
 
															   }
														
@@ -1465,7 +1523,7 @@ uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule,
 
															     const auto format = translateSampledTypeToImageFormat(sampledType);
														
 
															     return theBuilder.getImageType(
														
 
															         translateType(getElementType(sampledType)), spv::Dim::Buffer,
														
 
															-        /*depth*/ 0, /*isArray*/ 0, /*ms*/ 0,
														
 
															+        /*depth*/ 2, /*isArray*/ 0, /*ms*/ 0,
														
 
															         /*sampled*/ name == "Buffer" ? 1 : 2, format);
														
 
															   }
														
@@ -1495,7 +1553,7 @@ uint32_t TypeTranslator::translateResourceType(QualType type, LayoutRule rule,
 
															     const auto sampledType = hlsl::GetHLSLResourceResultType(type);
														
 
															     return theBuilder.getImageType(
														
 
															         translateType(getElementType(sampledType)), spv::Dim::SubpassData,
														
 
															-        /*depth*/ 0, /*isArray*/ false, /*ms*/ name == "SubpassInputMS",
														
 
															+        /*depth*/ 2, /*isArray*/ false, /*ms*/ name == "SubpassInputMS",
														
 
															         /*sampled*/ 2);
														
 
															   }
														
@@ -1655,6 +1713,16 @@ TypeTranslator::getAlignmentAndSize(QualType type, LayoutRule rule,
 
															         case BuiltinType::LongLong:
														
 
															         case BuiltinType::ULongLong:
														
 
															           return {8, 8};
														
 
															+        case BuiltinType::Short:
														
 
															+        case BuiltinType::UShort:
														
 
															+        case BuiltinType::Min12Int:
														
 
															+        case BuiltinType::Half:
														
 
															+        case BuiltinType::Min10Float: {
														
 
															+          if (spirvOptions.enable16BitTypes)
														
 
															+            return {2, 2};
														
 
															+          else
														
 
															+            return {4, 4};
														
 
															+        }
														
 
															         default:
														
 
															           emitError("alignment and size calculation for type %0 unimplemented")
														
 
															               << type;
														
@@ -1813,6 +1881,22 @@ std::string TypeTranslator::getName(QualType type) {
 
															           return "uint";
														
 
															         case BuiltinType::Float:
														
 
															           return "float";
														
 
															+        case BuiltinType::Double:
														
 
															+          return "double";
														
 
															+        case BuiltinType::LongLong:
														
 
															+          return "int64";
														
 
															+        case BuiltinType::ULongLong:
														
 
															+          return "uint64";
														
 
															+        case BuiltinType::Short:
														
 
															+          return "short";
														
 
															+        case BuiltinType::UShort:
														
 
															+          return "ushort";
														
 
															+        case BuiltinType::Half:
														
 
															+          return "half";
														
 
															+        case BuiltinType::Min12Int:
														
 
															+          return "min12int";
														
 
															+        case BuiltinType::Min10Float:
														
 
															+          return "min10float";
														
 
															         default:
														
 
															           return "";
														
 
															         }
														
--- a/tools/clang/lib/SPIRV/TypeTranslator.h
+++ b/tools/clang/lib/SPIRV/TypeTranslator.h
@@ -55,29 +55,11 @@ public:
 
															   uint32_t translateType(QualType type,
														
 
															                          LayoutRule layoutRule = LayoutRule::Void);
														
 
															-  /// \brief Translates the given HLSL resource type into its SPIR-V
														
 
															-  /// instructions and returns the <result-id>. Returns 0 on failure.
														
 
															-  uint32_t translateResourceType(QualType type, LayoutRule rule,
														
 
															-                                 bool isDepthCmp = false);
														
 
															-
														
 
															   /// \brief Generates the SPIR-V type for the counter associated with a
														
 
															   /// {Append|Consume}StructuredBuffer: an OpTypeStruct with a single 32-bit
														
 
															   /// integer value. This type will be decorated with BufferBlock.
														
 
															   uint32_t getACSBufferCounter();
														
 
															-  /// \brief Returns the type for the gl_PerVertex struct:
														
 
															-  ///
														
 
															-  /// struct gl_PerVertex {
														
 
															-  ///   float4 gl_Position;
														
 
															-  ///   float  gl_PointSize;
														
 
															-  ///   float  gl_ClipDistance[];
														
 
															-  ///   float  gl_CullDistance[];
														
 
															-  /// };
														
 
															-  uint32_t
														
 
															-  getGlPerVertexStruct(uint32_t clipArraySize, uint32_t cullArraySize,
														
 
															-                       llvm::StringRef structName,
														
 
															-                       const llvm::SmallVector<std::string, 4> &fieldSemantics);
														
 
															-
														
 
															   /// \brief Returns true if the given type is a (RW)StructuredBuffer type.
														
 
															   static bool isStructuredBuffer(QualType type);
														
@@ -106,6 +88,9 @@ public:
 
															   /// containing one of the above.
														
 
															   static bool isOrContainsAKindOfStructuredOrByteBuffer(QualType type);
														
 
															+  /// \brief Returns true if the given type is or contains 16-bit type.
														
 
															+  bool isOrContains16BitType(QualType type);
														
 
															+
														
 
															   /// \brief Returns true if the given type is the HLSL Buffer type.
														
 
															   static bool isBuffer(QualType type);
														
@@ -303,6 +288,10 @@ private:
 
															   /// constnesss and literalness.
														
 
															   static bool canTreatAsSameScalarType(QualType type1, QualType type2);
														
 
															+  /// \brief Translates the given HLSL resource type into its SPIR-V
														
 
															+  /// instructions and returns the <result-id>. Returns 0 on failure.
														
 
															+  uint32_t translateResourceType(QualType type, LayoutRule rule);
														
 
															+
														
 
															   /// \brief For the given sampled type, returns the corresponding image format
														
 
															   /// that can be used to create an image object.
														
 
															   spv::ImageFormat translateSampledTypeToImageFormat(QualType type);
														
--- a/tools/clang/lib/Sema/SemaHLSL.cpp
+++ b/tools/clang/lib/Sema/SemaHLSL.cpp
@@ -4149,7 +4149,7 @@ public:
 
															   /// <param name="RHS">Right hand side.</param>
														
 
															   /// <param name="QuestionLoc">Location of question mark in operator.</param>
														
 
															   /// <returns>Result type of vector conditional expression.</returns>
														
 
															-  clang::QualType HLSLExternalSource::CheckVectorConditional(
														
 
															+  clang::QualType CheckVectorConditional(
														
 
															     _In_ ExprResult &Cond,
														
 
															     _In_ ExprResult &LHS,
														
 
															     _In_ ExprResult &RHS,
														
@@ -6343,7 +6343,7 @@ UINT64 HLSLExternalSource::ScoreCast(QualType pLType, QualType pRType)
 
															   }
														
 
															 #define SCORE_COND(shift, cond) { \
														
 
															-  if (cond) uScore += 1UI64 << (SCORE_MIN_SHIFT + SCORE_PARAM_SHIFT * shift); }
														
 
															+  if (cond) uScore += 1ULL << (SCORE_MIN_SHIFT + SCORE_PARAM_SHIFT * shift); }
														
 
															   SCORE_COND(0, uRSize < uLSize);
														
 
															   SCORE_COND(1, bLPromo);
														
 
															   SCORE_COND(2, bRPromo);
														
@@ -7442,6 +7442,9 @@ bool HLSLExternalSource::CanConvert(
 
															   _Out_opt_ TYPE_CONVERSION_REMARKS* remarks,
														
 
															   _Inout_opt_ StandardConversionSequence* standard)
														
 
															 {
														
 
															+  bool bCheckElt = false;
														
 
															+  UINT uTSize, uSSize;
														
 
															+
														
 
															   DXASSERT_NOMSG(sourceExpr != nullptr);
														
 
															   DXASSERT_NOMSG(!target.isNull());
														
@@ -7500,8 +7503,8 @@ bool HLSLExternalSource::CanConvert(
 
															   CollectInfo(target, &TargetInfo);
														
 
															   CollectInfo(source, &SourceInfo);
														
 
															-  UINT uTSize = TargetInfo.uTotalElts;
														
 
															-  UINT uSSize = SourceInfo.uTotalElts;
														
 
															+  uTSize = TargetInfo.uTotalElts;
														
 
															+  uSSize = SourceInfo.uTotalElts;
														
 
															   // TODO: TYPE_CONVERSION_BY_REFERENCE does not seem possible here
														
 
															   // are we missing cases?
														
@@ -7620,7 +7623,6 @@ bool HLSLExternalSource::CanConvert(
 
															   // 5. The result of a matrix and a vector is similar to #4.
														
 
															   //
														
 
															-  bool bCheckElt = false;
														
 
															   switch (TargetInfo.ShapeKind) {
														
 
															   case AR_TOBJ_BASIC:
														
@@ -10664,6 +10666,10 @@ void hlsl::HandleDeclAttributeForHLSL(Sema &S, Decl *D, const AttributeList &A,
 
															     declAttr = ::new (S.Context) VKLocationAttr(A.getRange(), S.Context,
														
 
															       ValidateAttributeIntArg(S, A), A.getAttributeSpellingListIndex());
														
 
															     break;
														
 
															+  case AttributeList::AT_VKIndex:
														
 
															+    declAttr = ::new (S.Context) VKIndexAttr(A.getRange(), S.Context,
														
 
															+      ValidateAttributeIntArg(S, A), A.getAttributeSpellingListIndex());
														
 
															+    break;
														
 
															   case AttributeList::AT_VKBinding:
														
 
															     declAttr = ::new (S.Context) VKBindingAttr(A.getRange(), S.Context,
														
 
															       ValidateAttributeIntArg(S, A), ValidateAttributeIntArg(S, A, 1),
														
@@ -11033,6 +11039,10 @@ bool Sema::DiagnoseHLSLDecl(Declarator &D, DeclContext *DC,
 
															       nestedDiagId = diag::err_hlsl_unsupported_nested_typedef;
														
 
															     }
														
 
															+    if (isField && pType && pType->isIncompleteArrayType()) {
														
 
															+      nestedDiagId = diag::err_hlsl_unsupported_incomplete_array;
														
 
															+    }
														
 
															+
														
 
															     if (nestedDiagId) {
														
 
															       Diag(D.getLocStart(), nestedDiagId);
														
 
															       D.setInvalidType();
														
--- a/tools/clang/test/CodeGenHLSL/quick-test/bool_cast.hlsl
+++ b/tools/clang/test/CodeGenHLSL/quick-test/bool_cast.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -E main -T ps_6_0 %s | FileCheck %s
														
 
															+
														
 
															+
														
 
															+// Make sure it compiles
														
 
															+// CHECK: uitofp i1
														
 
															+
														
 
															+static bool t;
														
 
															+float main( float a:A) : SV_Target
														
 
															+{
														
 
															+    t.x = bool(a);
														
 
															+    return t;
														
 
															+}
														
--- a/tools/clang/test/CodeGenHLSL/quick-test/default-matrix-in-template.hlsl
+++ b/tools/clang/test/CodeGenHLSL/quick-test/default-matrix-in-template.hlsl
@@ -0,0 +1,15 @@
 
															+// RUN: %dxc -E main -T cs_6_0 %s  | FileCheck %s
														
 
															+
														
 
															+// CHECK: %class.StructuredBuffer = type { %class.matrix.float.4.4 }
														
 
															+
														
 
															+StructuredBuffer<matrix> buf1;
														
 
															+// Should be equivalent to:
														
 
															+// StructuredBuffer<matrix<float, 4, 4> > buf1;
														
 
															+
														
 
															+RWBuffer<float4> buf2;
														
 
															+
														
 
															+[RootSignature("DescriptorTable(SRV(t0), UAV(u0))")]
														
 
															+[numthreads(8, 8, 1)]
														
 
															+void main(uint3 tid : SV_DispatchThreadID) {
														
 
															+  buf2[tid.x] = buf1[tid.x][tid.y];
														
 
															+}
														
--- a/tools/clang/test/CodeGenHLSL/quick-test/incomp_array.hlsl
+++ b/tools/clang/test/CodeGenHLSL/quick-test/incomp_array.hlsl
@@ -2,7 +2,7 @@
 
															 // Verify no hang on incomplete array
														
 
															-// CHECK: %struct.Special = type { <4 x float>, [0 x i32] }
														
 
															+// CHECK: %struct.Special = type { <4 x float>, [3 x i32] }
														
 
															 // CHECK: %"$Globals" = type { i32, %struct.Special }
														
 
															 typedef const int inta[];
														
@@ -14,12 +14,12 @@ int i;
 
															 struct Special {
														
 
															   float4 member;
														
 
															-  inta a;
														
 
															+  int a[3];
														
 
															 };
														
 
															 Special c_special;
														
 
															-static const Special s_special = { { 1, 2, 3, 4}, { 1, 2, 3 } };
														
 
															+static const Special s_special = { { 1, 2, 3, 4}, { 5, 6, 7 } };
														
 
															 // CHECK: define <4 x float>
														
 
															 // CHECK: fn1
														
@@ -40,7 +40,14 @@ float4 fn1(in Special in1: SEMANTIC_IN) : SEMANTIC_OUT {
 
															 // CHECK: fn2
														
 
															 // @"\01?fn2@@YA?AV?$vector@M$03@@USpecial@@@Z"
														
 
															 float4 fn2(in Special in1: SEMANTIC_IN) : SEMANTIC_OUT {
														
 
															-  // s_special.a[i] is broken: it just assumes 0.
														
 
															+  // CHECK: call %dx.types.CBufRet.i32 @dx.op.cbufferLoadLegacy.i32(
														
 
															+  // CHECK: i32 0)
														
 
															+  // CHECK: extractvalue
														
 
															+  // CHECK: , 0
														
 
															+  // CHECK: getelementptr
														
 
															+  // CHECK: load i32, i32*
														
 
															+  // CHECK: sitofp i32
														
 
															+  // CHECK: fadd float
														
 
															   return in1.member + (float)s_special.a[i];
														
 
															 }
														
--- a/tools/clang/test/CodeGenHLSL/share_mem_dbg.hlsl
+++ b/tools/clang/test/CodeGenHLSL/share_mem_dbg.hlsl
@@ -1,4 +1,4 @@
 
															-// RUN: %dxc -E main -T cs_6_0 -Zi -Od %s | FileCheck %s
														
 
															+// RUN: %dxc -E main -T cs_6_0 -Zi -Od -DDefineA -DDefineB=0 %s | FileCheck %s
														
 
															 // CHECK: threadId
														
 
															 // CHECK: groupId
														
@@ -6,6 +6,12 @@
 
															 // CHECK: flattenedThreadIdInGroup
														
 
															 // CHECK: addrspace(3)
														
 
															+// Make sure source info exist.
														
 
															+// CHECK: !dx.source.contents
														
 
															+// CHECK: !dx.source.defines
														
 
															+// CHECK: !dx.source.mainFileName
														
 
															+// CHECK: !dx.source.args
														
 
															+
														
 
															 // CHECK: DIGlobalVariable(name: "dataC.1.0"
														
 
															 // CHECK: DIDerivedType(tag: DW_TAG_member, name: ".1.0"
														
 
															 // CHECK: DIGlobalVariable(name: "dataC.1.1"
														
@@ -13,6 +19,13 @@
 
															 // CHECK: DIGlobalVariable(name: "dataC.0
														
 
															 // CHECK: DIDerivedType(tag: DW_TAG_member, name: ".0"
														
 
															+// Make sure source info contents exist.
														
 
															+// CHECK: share_mem_dbg.hlsl", !"// RUN: %dxc
														
 
															+// CHECK: !{!"DefineA=1", !"DefineB=0"}
														
 
															+// CHECK: share_mem_dbg.hlsl"}
														
 
															+// CHECK: !{!"-E", !"main", !"-T", !"cs_6_0", !"-Zi", !"-Od", !"-D", !"DefineA", !"-D", !"DefineB=0"}
														
 
															+
														
 
															+
														
 
															 struct S {
														
 
															   column_major float2x2 d;
														
 
															   float2  b;
														
--- a/tools/clang/test/CodeGenHLSL/srv_ms_load1.hlsl
+++ b/tools/clang/test/CodeGenHLSL/srv_ms_load1.hlsl
@@ -1,6 +1,8 @@
 
															 // RUN: %dxc -E main -T ps_6_0 %s | FileCheck %s
														
 
															-// CHECK: textureLoad
														
 
															+// CHECK-DAG: textureLoad.f32({{.*}}, i32 undef, i32 undef, i32 undef)
														
 
															+// CHECK-DAG: textureLoad.f32({{.*}}, i32 -5, i32 7, i32 undef)
														
 
															+// CHECK-DAG: textureLoad.f32({{.*}}, i32 0, i32 0, i32 undef)
														
 
															 Texture2DMS<float3> srv1 : register(t3);
														
--- a/tools/clang/test/CodeGenSPIRV/bezier.domain.hlsl2spv
+++ b/tools/clang/test/CodeGenSPIRV/bezier.domain.hlsl2spv
@@ -48,15 +48,12 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // CHECK-WHOLE-SPIR-V:
														
 
															 // OpCapability Tessellation
														
 
															 // OpMemoryModel Logical GLSL450
														
 
															-// OpEntryPoint TessellationEvaluation %BezierEvalDS "BezierEvalDS" %gl_PerVertexIn %gl_PerVertexOut %gl_TessLevelOuter %gl_TessLevelInner %in_var_TANGENT %in_var_TEXCOORD %in_var_TANUCORNER %in_var_TANVCORNER %in_var_TANWEIGHTS %gl_TessCoord %in_var_BEZIERPOS %out_var_NORMAL %out_var_TEXCOORD %out_var_TANGENT %out_var_BITANGENT
														
 
															+// OpEntryPoint TessellationEvaluation %BezierEvalDS "BezierEvalDS" %gl_TessLevelOuter %gl_TessLevelInner %in_var_TANGENT %in_var_TEXCOORD %in_var_TANUCORNER %in_var_TANVCORNER %in_var_TANWEIGHTS %gl_TessCoord %in_var_BEZIERPOS %out_var_NORMAL %out_var_TEXCOORD %out_var_TANGENT %out_var_BITANGENT %gl_Position
														
 
															 // OpExecutionMode %BezierEvalDS Quads
														
 
															 // OpSource HLSL 600
														
 
															 // OpName %bb_entry "bb.entry"
														
 
															 // OpName %src_BezierEvalDS "src.BezierEvalDS"
														
 
															 // OpName %BezierEvalDS "BezierEvalDS"
														
 
															-// OpName %type_gl_PerVertex "type.gl_PerVertex"
														
 
															-// OpName %gl_PerVertexIn "gl_PerVertexIn"
														
 
															-// OpName %gl_PerVertexOut "gl_PerVertexOut"
														
 
															 // OpName %HS_CONSTANT_DATA_OUTPUT "HS_CONSTANT_DATA_OUTPUT"
														
 
															 // OpMemberName %HS_CONSTANT_DATA_OUTPUT 0 "Edges"
														
 
															 // OpMemberName %HS_CONSTANT_DATA_OUTPUT 1 "Inside"
														
@@ -90,11 +87,6 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // OpName %UV "UV"
														
 
															 // OpName %bezpatch "bezpatch"
														
 
															 // OpName %Output "Output"
														
 
															-// OpMemberDecorate %type_gl_PerVertex 0 BuiltIn Position
														
 
															-// OpMemberDecorate %type_gl_PerVertex 1 BuiltIn PointSize
														
 
															-// OpMemberDecorate %type_gl_PerVertex 2 BuiltIn ClipDistance
														
 
															-// OpMemberDecorate %type_gl_PerVertex 3 BuiltIn CullDistance
														
 
															-// OpDecorate %type_gl_PerVertex Block
														
 
															 // OpDecorate %gl_TessLevelOuter BuiltIn TessLevelOuter
														
 
															 // OpDecorate %gl_TessLevelOuter Patch
														
 
															 // OpDecorate %gl_TessLevelInner BuiltIn TessLevelInner
														
@@ -106,6 +98,7 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // OpDecorate %in_var_TANWEIGHTS Patch
														
 
															 // OpDecorate %gl_TessCoord BuiltIn TessCoord
														
 
															 // OpDecorate %gl_TessCoord Patch
														
 
															+// OpDecorate %gl_Position BuiltIn Position
														
 
															 // OpDecorate %in_var_BEZIERPOS Location 0
														
 
															 // OpDecorate %in_var_TANGENT Location 1
														
 
															 // OpDecorate %in_var_TANUCORNER Location 5
														
@@ -119,15 +112,8 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // %void = OpTypeVoid
														
 
															 // %3 = OpTypeFunction %void
														
 
															 // %float = OpTypeFloat 32
														
 
															-// %v4float = OpTypeVector %float 4
														
 
															 // %uint = OpTypeInt 32 0
														
 
															-// %uint_1 = OpConstant %uint 1
														
 
															-// %_arr_float_uint_1 = OpTypeArray %float %uint_1
														
 
															-// %type_gl_PerVertex = OpTypeStruct %v4float %float %_arr_float_uint_1 %_arr_float_uint_1
														
 
															 // %uint_4 = OpConstant %uint 4
														
 
															-// %_arr_type_gl_PerVertex_uint_4 = OpTypeArray %type_gl_PerVertex %uint_4
														
 
															-// %_ptr_Input__arr_type_gl_PerVertex_uint_4 = OpTypePointer Input %_arr_type_gl_PerVertex_uint_4
														
 
															-// %_ptr_Output_type_gl_PerVertex = OpTypePointer Output %type_gl_PerVertex
														
 
															 // %_arr_float_uint_4 = OpTypeArray %float %uint_4
														
 
															 // %uint_2 = OpConstant %uint 2
														
 
															 // %_arr_float_uint_2 = OpTypeArray %float %uint_2
														
@@ -135,6 +121,7 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // %_arr_v3float_uint_4 = OpTypeArray %v3float %uint_4
														
 
															 // %v2float = OpTypeVector %float 2
														
 
															 // %_arr_v2float_uint_4 = OpTypeArray %v2float %uint_4
														
 
															+// %v4float = OpTypeVector %float 4
														
 
															 // %HS_CONSTANT_DATA_OUTPUT = OpTypeStruct %_arr_float_uint_4 %_arr_float_uint_2 %_arr_v3float_uint_4 %_arr_v2float_uint_4 %_arr_v3float_uint_4 %_arr_v3float_uint_4 %v4float
														
 
															 // %_ptr_Function_HS_CONSTANT_DATA_OUTPUT = OpTypePointer Function %HS_CONSTANT_DATA_OUTPUT
														
 
															 // %_ptr_Input__arr_float_uint_4 = OpTypePointer Input %_arr_float_uint_4
														
@@ -151,11 +138,8 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // %_ptr_Output_v3float = OpTypePointer Output %v3float
														
 
															 // %_ptr_Output_v2float = OpTypePointer Output %v2float
														
 
															 // %_ptr_Output_v4float = OpTypePointer Output %v4float
														
 
															-// %uint_0 = OpConstant %uint 0
														
 
															-// %85 = OpTypeFunction %DS_OUTPUT %_ptr_Function_HS_CONSTANT_DATA_OUTPUT %_ptr_Function_v2float %_ptr_Function__arr_BEZIER_CONTROL_POINT_uint_4
														
 
															+// %76 = OpTypeFunction %DS_OUTPUT %_ptr_Function_HS_CONSTANT_DATA_OUTPUT %_ptr_Function_v2float %_ptr_Function__arr_BEZIER_CONTROL_POINT_uint_4
														
 
															 // %_ptr_Function_DS_OUTPUT = OpTypePointer Function %DS_OUTPUT
														
 
															-// %gl_PerVertexIn = OpVariable %_ptr_Input__arr_type_gl_PerVertex_uint_4 Input
														
 
															-// %gl_PerVertexOut = OpVariable %_ptr_Output_type_gl_PerVertex Output
														
 
															 // %gl_TessLevelOuter = OpVariable %_ptr_Input__arr_float_uint_4 Input
														
 
															 // %gl_TessLevelInner = OpVariable %_ptr_Input__arr_float_uint_2 Input
														
 
															 // %in_var_TANGENT = OpVariable %_ptr_Input__arr_v3float_uint_4 Input
														
@@ -169,54 +153,54 @@ DS_OUTPUT BezierEvalDS( HS_CONSTANT_DATA_OUTPUT input,
 
															 // %out_var_TEXCOORD = OpVariable %_ptr_Output_v2float Output
														
 
															 // %out_var_TANGENT = OpVariable %_ptr_Output_v3float Output
														
 
															 // %out_var_BITANGENT = OpVariable %_ptr_Output_v3float Output
														
 
															+// %gl_Position = OpVariable %_ptr_Output_v4float Output
														
 
															 // %BezierEvalDS = OpFunction %void None %3
														
 
															-// %17 = OpLabel
														
 
															+// %5 = OpLabel
														
 
															 // %param_var_input = OpVariable %_ptr_Function_HS_CONSTANT_DATA_OUTPUT Function
														
 
															 // %param_var_UV = OpVariable %_ptr_Function_v2float Function
														
 
															 // %param_var_bezpatch = OpVariable %_ptr_Function__arr_BEZIER_CONTROL_POINT_uint_4 Function
														
 
															-// %30 = OpLoad %_arr_float_uint_4 %gl_TessLevelOuter
														
 
															-// %33 = OpLoad %_arr_float_uint_2 %gl_TessLevelInner
														
 
															-// %36 = OpLoad %_arr_v3float_uint_4 %in_var_TANGENT
														
 
															-// %39 = OpLoad %_arr_v2float_uint_4 %in_var_TEXCOORD
														
 
															-// %41 = OpLoad %_arr_v3float_uint_4 %in_var_TANUCORNER
														
 
															-// %43 = OpLoad %_arr_v3float_uint_4 %in_var_TANVCORNER
														
 
															-// %46 = OpLoad %v4float %in_var_TANWEIGHTS
														
 
															-// %47 = OpCompositeConstruct %HS_CONSTANT_DATA_OUTPUT %30 %33 %36 %39 %41 %43 %46
														
 
															-// OpStore %param_var_input %47
														
 
															-// %52 = OpLoad %v3float %gl_TessCoord
														
 
															-// %53 = OpVectorShuffle %v2float %52 %52 0 1
														
 
															-// OpStore %param_var_UV %53
														
 
															-// %59 = OpLoad %_arr_v3float_uint_4 %in_var_BEZIERPOS
														
 
															-// %60 = OpCompositeExtract %v3float %59 0
														
 
															-// %61 = OpCompositeConstruct %BEZIER_CONTROL_POINT %60
														
 
															-// %62 = OpCompositeExtract %v3float %59 1
														
 
															-// %63 = OpCompositeConstruct %BEZIER_CONTROL_POINT %62
														
 
															-// %64 = OpCompositeExtract %v3float %59 2
														
 
															-// %65 = OpCompositeConstruct %BEZIER_CONTROL_POINT %64
														
 
															-// %66 = OpCompositeExtract %v3float %59 3
														
 
															-// %67 = OpCompositeConstruct %BEZIER_CONTROL_POINT %66
														
 
															-// %68 = OpCompositeConstruct %_arr_BEZIER_CONTROL_POINT_uint_4 %61 %63 %65 %67
														
 
															-// OpStore %param_var_bezpatch %68
														
 
															-// %70 = OpFunctionCall %DS_OUTPUT %src_BezierEvalDS %param_var_input %param_var_UV %param_var_bezpatch
														
 
															-// %71 = OpCompositeExtract %v3float %70 0
														
 
															-// OpStore %out_var_NORMAL %71
														
 
															-// %74 = OpCompositeExtract %v2float %70 1
														
 
															-// OpStore %out_var_TEXCOORD %74
														
 
															-// %77 = OpCompositeExtract %v3float %70 2
														
 
															-// OpStore %out_var_TANGENT %77
														
 
															-// %79 = OpCompositeExtract %v3float %70 3
														
 
															-// OpStore %out_var_BITANGENT %79
														
 
															-// %81 = OpCompositeExtract %v4float %70 4
														
 
															-// %84 = OpAccessChain %_ptr_Output_v4float %gl_PerVertexOut %uint_0
														
 
															-// OpStore %84 %81
														
 
															+// %22 = OpLoad %_arr_float_uint_4 %gl_TessLevelOuter
														
 
															+// %25 = OpLoad %_arr_float_uint_2 %gl_TessLevelInner
														
 
															+// %28 = OpLoad %_arr_v3float_uint_4 %in_var_TANGENT
														
 
															+// %31 = OpLoad %_arr_v2float_uint_4 %in_var_TEXCOORD
														
 
															+// %33 = OpLoad %_arr_v3float_uint_4 %in_var_TANUCORNER
														
 
															+// %35 = OpLoad %_arr_v3float_uint_4 %in_var_TANVCORNER
														
 
															+// %38 = OpLoad %v4float %in_var_TANWEIGHTS
														
 
															+// %39 = OpCompositeConstruct %HS_CONSTANT_DATA_OUTPUT %22 %25 %28 %31 %33 %35 %38
														
 
															+// OpStore %param_var_input %39
														
 
															+// %44 = OpLoad %v3float %gl_TessCoord
														
 
															+// %45 = OpVectorShuffle %v2float %44 %44 0 1
														
 
															+// OpStore %param_var_UV %45
														
 
															+// %51 = OpLoad %_arr_v3float_uint_4 %in_var_BEZIERPOS
														
 
															+// %52 = OpCompositeExtract %v3float %51 0
														
 
															+// %53 = OpCompositeConstruct %BEZIER_CONTROL_POINT %52
														
 
															+// %54 = OpCompositeExtract %v3float %51 1
														
 
															+// %55 = OpCompositeConstruct %BEZIER_CONTROL_POINT %54
														
 
															+// %56 = OpCompositeExtract %v3float %51 2
														
 
															+// %57 = OpCompositeConstruct %BEZIER_CONTROL_POINT %56
														
 
															+// %58 = OpCompositeExtract %v3float %51 3
														
 
															+// %59 = OpCompositeConstruct %BEZIER_CONTROL_POINT %58
														
 
															+// %60 = OpCompositeConstruct %_arr_BEZIER_CONTROL_POINT_uint_4 %53 %55 %57 %59
														
 
															+// OpStore %param_var_bezpatch %60
														
 
															+// %62 = OpFunctionCall %DS_OUTPUT %src_BezierEvalDS %param_var_input %param_var_UV %param_var_bezpatch
														
 
															+// %63 = OpCompositeExtract %v3float %62 0
														
 
															+// OpStore %out_var_NORMAL %63
														
 
															+// %66 = OpCompositeExtract %v2float %62 1
														
 
															+// OpStore %out_var_TEXCOORD %66
														
 
															+// %69 = OpCompositeExtract %v3float %62 2
														
 
															+// OpStore %out_var_TANGENT %69
														
 
															+// %71 = OpCompositeExtract %v3float %62 3
														
 
															+// OpStore %out_var_BITANGENT %71
														
 
															+// %73 = OpCompositeExtract %v4float %62 4
														
 
															+// OpStore %gl_Position %73
														
 
															 // OpReturn
														
 
															 // OpFunctionEnd
														
 
															-// %src_BezierEvalDS = OpFunction %DS_OUTPUT None %85
														
 
															+// %src_BezierEvalDS = OpFunction %DS_OUTPUT None %76
														
 
															 // %input = OpFunctionParameter %_ptr_Function_HS_CONSTANT_DATA_OUTPUT
														
 
															 // %UV = OpFunctionParameter %_ptr_Function_v2float
														
 
															 // %bezpatch = OpFunctionParameter %_ptr_Function__arr_BEZIER_CONTROL_POINT_uint_4
														
 
															 // %bb_entry = OpLabel
														
 
															 // %Output = OpVariable %_ptr_Function_DS_OUTPUT Function
														
 
															-// %92 = OpLoad %DS_OUTPUT %Output
														
 
															-// OpReturnValue %92
														
 
															+// %83 = OpLoad %DS_OUTPUT %Output
														
 
															+// OpReturnValue %83
														
 
															 // OpFunctionEnd
														
--- a/tools/clang/test/CodeGenSPIRV/bezier.hull.hlsl2spv
+++ b/tools/clang/test/CodeGenSPIRV/bezier.hull.hlsl2spv
@@ -59,7 +59,7 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // CHECK-WHOLE-SPIR-V:
														
 
															 // OpCapability Tessellation
														
 
															 // OpMemoryModel Logical GLSL450
														
 
															-// OpEntryPoint TessellationControl %SubDToBezierHS "SubDToBezierHS" %gl_PerVertexIn %gl_PerVertexOut %in_var_WORLDPOS %in_var_TEXCOORD0 %in_var_TANGENT %gl_InvocationID %gl_PrimitiveID %out_var_BEZIERPOS %gl_TessLevelOuter %gl_TessLevelInner %out_var_TANGENT %out_var_TEXCOORD %out_var_TANUCORNER %out_var_TANVCORNER %out_var_TANWEIGHTS
														
 
															+// OpEntryPoint TessellationControl %SubDToBezierHS "SubDToBezierHS" %in_var_WORLDPOS %in_var_TEXCOORD0 %in_var_TANGENT %gl_InvocationID %gl_PrimitiveID %out_var_BEZIERPOS %gl_TessLevelOuter %gl_TessLevelInner %out_var_TANGENT %out_var_TEXCOORD %out_var_TANUCORNER %out_var_TANVCORNER %out_var_TANWEIGHTS
														
 
															 // OpExecutionMode %SubDToBezierHS Quads
														
 
															 // OpExecutionMode %SubDToBezierHS SpacingFractionalOdd
														
 
															 // OpExecutionMode %SubDToBezierHS VertexOrderCcw
														
@@ -71,9 +71,6 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // OpName %bb_entry_0 "bb.entry"
														
 
															 // OpName %src_SubDToBezierHS "src.SubDToBezierHS"
														
 
															 // OpName %SubDToBezierHS "SubDToBezierHS"
														
 
															-// OpName %type_gl_PerVertex "type.gl_PerVertex"
														
 
															-// OpName %gl_PerVertexIn "gl_PerVertexIn"
														
 
															-// OpName %gl_PerVertexOut "gl_PerVertexOut"
														
 
															 // OpName %VS_CONTROL_POINT_OUTPUT "VS_CONTROL_POINT_OUTPUT"
														
 
															 // OpMemberName %VS_CONTROL_POINT_OUTPUT 0 "vPosition"
														
 
															 // OpMemberName %VS_CONTROL_POINT_OUTPUT 1 "vUV"
														
@@ -109,11 +106,6 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // OpName %PatchID_0 "PatchID"
														
 
															 // OpName %vsOutput "vsOutput"
														
 
															 // OpName %result "result"
														
 
															-// OpMemberDecorate %type_gl_PerVertex 0 BuiltIn Position
														
 
															-// OpMemberDecorate %type_gl_PerVertex 1 BuiltIn PointSize
														
 
															-// OpMemberDecorate %type_gl_PerVertex 2 BuiltIn ClipDistance
														
 
															-// OpMemberDecorate %type_gl_PerVertex 3 BuiltIn CullDistance
														
 
															-// OpDecorate %type_gl_PerVertex Block
														
 
															 // OpDecorate %gl_InvocationID BuiltIn InvocationId
														
 
															 // OpDecorate %gl_PrimitiveID BuiltIn PrimitiveId
														
 
															 // OpDecorate %gl_TessLevelOuter BuiltIn TessLevelOuter
														
@@ -137,18 +129,11 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // %void = OpTypeVoid
														
 
															 // %3 = OpTypeFunction %void
														
 
															 // %float = OpTypeFloat 32
														
 
															-// %v4float = OpTypeVector %float 4
														
 
															-// %uint = OpTypeInt 32 0
														
 
															-// %uint_1 = OpConstant %uint 1
														
 
															-// %_arr_float_uint_1 = OpTypeArray %float %uint_1
														
 
															-// %type_gl_PerVertex = OpTypeStruct %v4float %float %_arr_float_uint_1 %_arr_float_uint_1
														
 
															-// %uint_3 = OpConstant %uint 3
														
 
															-// %_arr_type_gl_PerVertex_uint_3 = OpTypeArray %type_gl_PerVertex %uint_3
														
 
															-// %_ptr_Input__arr_type_gl_PerVertex_uint_3 = OpTypePointer Input %_arr_type_gl_PerVertex_uint_3
														
 
															-// %_ptr_Output__arr_type_gl_PerVertex_uint_3 = OpTypePointer Output %_arr_type_gl_PerVertex_uint_3
														
 
															 // %v3float = OpTypeVector %float 3
														
 
															 // %v2float = OpTypeVector %float 2
														
 
															 // %VS_CONTROL_POINT_OUTPUT = OpTypeStruct %v3float %v2float %v3float
														
 
															+// %uint = OpTypeInt 32 0
														
 
															+// %uint_3 = OpConstant %uint 3
														
 
															 // %_arr_VS_CONTROL_POINT_OUTPUT_uint_3 = OpTypeArray %VS_CONTROL_POINT_OUTPUT %uint_3
														
 
															 // %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 = OpTypePointer Function %_arr_VS_CONTROL_POINT_OUTPUT_uint_3
														
 
															 // %_arr_v3float_uint_3 = OpTypeArray %v3float %uint_3
														
@@ -161,20 +146,21 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // %_ptr_Output__arr_v3float_uint_3 = OpTypePointer Output %_arr_v3float_uint_3
														
 
															 // %_ptr_Output_v3float = OpTypePointer Output %v3float
														
 
															 // %uint_0 = OpConstant %uint 0
														
 
															+// %uint_4 = OpConstant %uint 4
														
 
															 // %uint_2 = OpConstant %uint 2
														
 
															 // %bool = OpTypeBool
														
 
															-// %uint_4 = OpConstant %uint 4
														
 
															 // %_arr_float_uint_4 = OpTypeArray %float %uint_4
														
 
															 // %_arr_float_uint_2 = OpTypeArray %float %uint_2
														
 
															 // %_arr_v3float_uint_4 = OpTypeArray %v3float %uint_4
														
 
															 // %_arr_v2float_uint_4 = OpTypeArray %v2float %uint_4
														
 
															+// %v4float = OpTypeVector %float 4
														
 
															 // %HS_CONSTANT_DATA_OUTPUT = OpTypeStruct %_arr_float_uint_4 %_arr_float_uint_2 %_arr_v3float_uint_4 %_arr_v2float_uint_4 %_arr_v3float_uint_4 %_arr_v3float_uint_4 %v4float
														
 
															 // %_ptr_Output__arr_float_uint_4 = OpTypePointer Output %_arr_float_uint_4
														
 
															 // %_ptr_Output__arr_float_uint_2 = OpTypePointer Output %_arr_float_uint_2
														
 
															 // %_ptr_Output__arr_v3float_uint_4 = OpTypePointer Output %_arr_v3float_uint_4
														
 
															 // %_ptr_Output__arr_v2float_uint_4 = OpTypePointer Output %_arr_v2float_uint_4
														
 
															 // %_ptr_Output_v4float = OpTypePointer Output %v4float
														
 
															-// %95 = OpTypeFunction %HS_CONSTANT_DATA_OUTPUT %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 %_ptr_Function_uint
														
 
															+// %87 = OpTypeFunction %HS_CONSTANT_DATA_OUTPUT %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 %_ptr_Function_uint
														
 
															 // %_ptr_Function_HS_CONSTANT_DATA_OUTPUT = OpTypePointer Function %HS_CONSTANT_DATA_OUTPUT
														
 
															 // %float_1 = OpConstant %float 1
														
 
															 // %int = OpTypeInt 32 1
														
@@ -188,12 +174,10 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // %int_3 = OpConstant %int 3
														
 
															 // %float_5 = OpConstant %float 5
														
 
															 // %float_6 = OpConstant %float 6
														
 
															-// %120 = OpTypeFunction %BEZIER_CONTROL_POINT %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 %_ptr_Function_uint %_ptr_Function_uint
														
 
															+// %112 = OpTypeFunction %BEZIER_CONTROL_POINT %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 %_ptr_Function_uint %_ptr_Function_uint
														
 
															 // %_ptr_Function_VS_CONTROL_POINT_OUTPUT = OpTypePointer Function %VS_CONTROL_POINT_OUTPUT
														
 
															 // %_ptr_Function_BEZIER_CONTROL_POINT = OpTypePointer Function %BEZIER_CONTROL_POINT
														
 
															 // %_ptr_Function_v3float = OpTypePointer Function %v3float
														
 
															-// %gl_PerVertexIn = OpVariable %_ptr_Input__arr_type_gl_PerVertex_uint_3 Input
														
 
															-// %gl_PerVertexOut = OpVariable %_ptr_Output__arr_type_gl_PerVertex_uint_3 Output
														
 
															 // %in_var_WORLDPOS = OpVariable %_ptr_Input__arr_v3float_uint_3 Input
														
 
															 // %in_var_TEXCOORD0 = OpVariable %_ptr_Input__arr_v2float_uint_3 Input
														
 
															 // %in_var_TANGENT = OpVariable %_ptr_Input__arr_v3float_uint_3 Input
														
@@ -208,90 +192,90 @@ BEZIER_CONTROL_POINT SubDToBezierHS(InputPatch<VS_CONTROL_POINT_OUTPUT, MAX_POIN
 
															 // %out_var_TANVCORNER = OpVariable %_ptr_Output__arr_v3float_uint_4 Output
														
 
															 // %out_var_TANWEIGHTS = OpVariable %_ptr_Output_v4float Output
														
 
															 // %SubDToBezierHS = OpFunction %void None %3
														
 
															-// %17 = OpLabel
														
 
															+// %5 = OpLabel
														
 
															 // %param_var_ip = OpVariable %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3 Function
														
 
															 // %param_var_cpid = OpVariable %_ptr_Function_uint Function
														
 
															 // %param_var_PatchID = OpVariable %_ptr_Function_uint Function
														
 
															-// %27 = OpLoad %_arr_v3float_uint_3 %in_var_WORLDPOS
														
 
															-// %31 = OpLoad %_arr_v2float_uint_3 %in_var_TEXCOORD0
														
 
															-// %33 = OpLoad %_arr_v3float_uint_3 %in_var_TANGENT
														
 
															-// %34 = OpCompositeExtract %v3float %27 0
														
 
															-// %35 = OpCompositeExtract %v2float %31 0
														
 
															-// %36 = OpCompositeExtract %v3float %33 0
														
 
															-// %37 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %34 %35 %36
														
 
															-// %38 = OpCompositeExtract %v3float %27 1
														
 
															-// %39 = OpCompositeExtract %v2float %31 1
														
 
															-// %40 = OpCompositeExtract %v3float %33 1
														
 
															-// %41 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %38 %39 %40
														
 
															-// %42 = OpCompositeExtract %v3float %27 2
														
 
															-// %43 = OpCompositeExtract %v2float %31 2
														
 
															-// %44 = OpCompositeExtract %v3float %33 2
														
 
															-// %45 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %42 %43 %44
														
 
															-// %46 = OpCompositeConstruct %_arr_VS_CONTROL_POINT_OUTPUT_uint_3 %37 %41 %45
														
 
															-// OpStore %param_var_ip %46
														
 
															-// %51 = OpLoad %uint %gl_InvocationID
														
 
															-// OpStore %param_var_cpid %51
														
 
															-// %54 = OpLoad %uint %gl_PrimitiveID
														
 
															-// OpStore %param_var_PatchID %54
														
 
															-// %56 = OpFunctionCall %BEZIER_CONTROL_POINT %src_SubDToBezierHS %param_var_ip %param_var_cpid %param_var_PatchID
														
 
															-// %57 = OpCompositeExtract %v3float %56 0
														
 
															-// %61 = OpAccessChain %_ptr_Output_v3float %out_var_BEZIERPOS %51
														
 
															-// OpStore %61 %57
														
 
															-// OpControlBarrier %uint_2 %uint_1 %uint_0
														
 
															-// %65 = OpIEqual %bool %51 %uint_0
														
 
															+// %18 = OpLoad %_arr_v3float_uint_3 %in_var_WORLDPOS
														
 
															+// %22 = OpLoad %_arr_v2float_uint_3 %in_var_TEXCOORD0
														
 
															+// %24 = OpLoad %_arr_v3float_uint_3 %in_var_TANGENT
														
 
															+// %25 = OpCompositeExtract %v3float %18 0
														
 
															+// %26 = OpCompositeExtract %v2float %22 0
														
 
															+// %27 = OpCompositeExtract %v3float %24 0
														
 
															+// %28 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %25 %26 %27
														
 
															+// %29 = OpCompositeExtract %v3float %18 1
														
 
															+// %30 = OpCompositeExtract %v2float %22 1
														
 
															+// %31 = OpCompositeExtract %v3float %24 1
														
 
															+// %32 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %29 %30 %31
														
 
															+// %33 = OpCompositeExtract %v3float %18 2
														
 
															+// %34 = OpCompositeExtract %v2float %22 2
														
 
															+// %35 = OpCompositeExtract %v3float %24 2
														
 
															+// %36 = OpCompositeConstruct %VS_CONTROL_POINT_OUTPUT %33 %34 %35
														
 
															+// %37 = OpCompositeConstruct %_arr_VS_CONTROL_POINT_OUTPUT_uint_3 %28 %32 %36
														
 
															+// OpStore %param_var_ip %37
														
 
															+// %42 = OpLoad %uint %gl_InvocationID
														
 
															+// OpStore %param_var_cpid %42
														
 
															+// %45 = OpLoad %uint %gl_PrimitiveID
														
 
															+// OpStore %param_var_PatchID %45
														
 
															+// %47 = OpFunctionCall %BEZIER_CONTROL_POINT %src_SubDToBezierHS %param_var_ip %param_var_cpid %param_var_PatchID
														
 
															+// %48 = OpCompositeExtract %v3float %47 0
														
 
															+// %52 = OpAccessChain %_ptr_Output_v3float %out_var_BEZIERPOS %42
														
 
															+// OpStore %52 %48
														
 
															+// OpControlBarrier %uint_2 %uint_4 %uint_0
														
 
															+// %57 = OpIEqual %bool %42 %uint_0
														
 
															 // OpSelectionMerge %if_merge None
														
 
															-// OpBranchConditional %65 %if_true %if_merge
														
 
															+// OpBranchConditional %57 %if_true %if_merge
														
 
															 // %if_true = OpLabel
														
 
															-// %75 = OpFunctionCall %HS_CONSTANT_DATA_OUTPUT %SubDToBezierConstantsHS %param_var_ip %param_var_PatchID
														
 
															-// %76 = OpCompositeExtract %_arr_float_uint_4 %75 0
														
 
															-// OpStore %gl_TessLevelOuter %76
														
 
															-// %79 = OpCompositeExtract %_arr_float_uint_2 %75 1
														
 
															-// OpStore %gl_TessLevelInner %79
														
 
															-// %82 = OpCompositeExtract %_arr_v3float_uint_4 %75 2
														
 
															-// OpStore %out_var_TANGENT %82
														
 
															-// %85 = OpCompositeExtract %_arr_v2float_uint_4 %75 3
														
 
															-// OpStore %out_var_TEXCOORD %85
														
 
															-// %88 = OpCompositeExtract %_arr_v3float_uint_4 %75 4
														
 
															-// OpStore %out_var_TANUCORNER %88
														
 
															-// %90 = OpCompositeExtract %_arr_v3float_uint_4 %75 5
														
 
															-// OpStore %out_var_TANVCORNER %90
														
 
															-// %92 = OpCompositeExtract %v4float %75 6
														
 
															-// OpStore %out_var_TANWEIGHTS %92
														
 
															+// %67 = OpFunctionCall %HS_CONSTANT_DATA_OUTPUT %SubDToBezierConstantsHS %param_var_ip %param_var_PatchID
														
 
															+// %68 = OpCompositeExtract %_arr_float_uint_4 %67 0
														
 
															+// OpStore %gl_TessLevelOuter %68
														
 
															+// %71 = OpCompositeExtract %_arr_float_uint_2 %67 1
														
 
															+// OpStore %gl_TessLevelInner %71
														
 
															+// %74 = OpCompositeExtract %_arr_v3float_uint_4 %67 2
														
 
															+// OpStore %out_var_TANGENT %74
														
 
															+// %77 = OpCompositeExtract %_arr_v2float_uint_4 %67 3
														
 
															+// OpStore %out_var_TEXCOORD %77
														
 
															+// %80 = OpCompositeExtract %_arr_v3float_uint_4 %67 4
														
 
															+// OpStore %out_var_TANUCORNER %80
														
 
															+// %82 = OpCompositeExtract %_arr_v3float_uint_4 %67 5
														
 
															+// OpStore %out_var_TANVCORNER %82
														
 
															+// %84 = OpCompositeExtract %v4float %67 6
														
 
															+// OpStore %out_var_TANWEIGHTS %84
														
 
															 // OpBranch %if_merge
														
 
															 // %if_merge = OpLabel
														
 
															 // OpReturn
														
 
															 // OpFunctionEnd
														
 
															-// %SubDToBezierConstantsHS = OpFunction %HS_CONSTANT_DATA_OUTPUT None %95
														
 
															+// %SubDToBezierConstantsHS = OpFunction %HS_CONSTANT_DATA_OUTPUT None %87
														
 
															 // %ip = OpFunctionParameter %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3
														
 
															 // %PatchID = OpFunctionParameter %_ptr_Function_uint
														
 
															 // %bb_entry = OpLabel
														
 
															 // %Output = OpVariable %_ptr_Function_HS_CONSTANT_DATA_OUTPUT Function
														
 
															-// %105 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_0
														
 
															-// OpStore %105 %float_1
														
 
															-// %108 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_1
														
 
															-// OpStore %108 %float_2
														
 
															-// %111 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_2
														
 
															-// OpStore %111 %float_3
														
 
															-// %114 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_3
														
 
															-// OpStore %114 %float_4
														
 
															-// %116 = OpAccessChain %_ptr_Function_float %Output %int_1 %int_0
														
 
															-// OpStore %116 %float_5
														
 
															-// %118 = OpAccessChain %_ptr_Function_float %Output %int_1 %int_1
														
 
															-// OpStore %118 %float_6
														
 
															-// %119 = OpLoad %HS_CONSTANT_DATA_OUTPUT %Output
														
 
															-// OpReturnValue %119
														
 
															+// %97 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_0
														
 
															+// OpStore %97 %float_1
														
 
															+// %100 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_1
														
 
															+// OpStore %100 %float_2
														
 
															+// %103 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_2
														
 
															+// OpStore %103 %float_3
														
 
															+// %106 = OpAccessChain %_ptr_Function_float %Output %int_0 %int_3
														
 
															+// OpStore %106 %float_4
														
 
															+// %108 = OpAccessChain %_ptr_Function_float %Output %int_1 %int_0
														
 
															+// OpStore %108 %float_5
														
 
															+// %110 = OpAccessChain %_ptr_Function_float %Output %int_1 %int_1
														
 
															+// OpStore %110 %float_6
														
 
															+// %111 = OpLoad %HS_CONSTANT_DATA_OUTPUT %Output
														
 
															+// OpReturnValue %111
														
 
															 // OpFunctionEnd
														
 
															-// %src_SubDToBezierHS = OpFunction %BEZIER_CONTROL_POINT None %120
														
 
															+// %src_SubDToBezierHS = OpFunction %BEZIER_CONTROL_POINT None %112
														
 
															 // %ip_0 = OpFunctionParameter %_ptr_Function__arr_VS_CONTROL_POINT_OUTPUT_uint_3
														
 
															 // %cpid = OpFunctionParameter %_ptr_Function_uint
														
 
															 // %PatchID_0 = OpFunctionParameter %_ptr_Function_uint
														
 
															 // %bb_entry_0 = OpLabel
														
 
															 // %vsOutput = OpVariable %_ptr_Function_VS_CONTROL_POINT_OUTPUT Function
														
 
															 // %result = OpVariable %_ptr_Function_BEZIER_CONTROL_POINT Function
														
 
															-// %130 = OpAccessChain %_ptr_Function_v3float %vsOutput %int_0
														
 
															-// %131 = OpLoad %v3float %130
														
 
															-// %132 = OpAccessChain %_ptr_Function_v3float %result %int_0
														
 
															-// OpStore %132 %131
														
 
															-// %133 = OpLoad %BEZIER_CONTROL_POINT %result
														
 
															-// OpReturnValue %133
														
 
															+// %122 = OpAccessChain %_ptr_Function_v3float %vsOutput %int_0
														
 
															+// %123 = OpLoad %v3float %122
														
 
															+// %124 = OpAccessChain %_ptr_Function_v3float %result %int_0
														
 
															+// OpStore %124 %123
														
 
															+// %125 = OpLoad %BEZIER_CONTROL_POINT %result
														
 
															+// OpReturnValue %125
														
 
															 // OpFunctionEnd
														
--- a/tools/clang/test/CodeGenSPIRV/empty-struct-interface.vs.hlsl2spv
+++ b/tools/clang/test/CodeGenSPIRV/empty-struct-interface.vs.hlsl2spv
@@ -15,47 +15,32 @@ VSOut main(VSIn input)
 
															 // CHECK-WHOLE-SPIR-V:
														
 
															 // OpCapability Shader
														
 
															 // OpMemoryModel Logical GLSL450
														
 
															-// OpEntryPoint Vertex %main "main" %gl_PerVertexOut
														
 
															+// OpEntryPoint Vertex %main "main"
														
 
															 // OpSource HLSL 600
														
 
															 // OpName %bb_entry "bb.entry"
														
 
															 // OpName %src_main "src.main"
														
 
															 // OpName %main "main"
														
 
															-// OpName %type_gl_PerVertex "type.gl_PerVertex"
														
 
															-// OpName %gl_PerVertexOut "gl_PerVertexOut"
														
 
															 // OpName %VSIn "VSIn"
														
 
															 // OpName %param_var_input "param.var.input"
														
 
															 // OpName %input "input"
														
 
															 // OpName %result "result"
														
 
															-// OpMemberDecorate %type_gl_PerVertex 0 BuiltIn Position
														
 
															-// OpMemberDecorate %type_gl_PerVertex 1 BuiltIn PointSize
														
 
															-// OpMemberDecorate %type_gl_PerVertex 2 BuiltIn ClipDistance
														
 
															-// OpMemberDecorate %type_gl_PerVertex 3 BuiltIn CullDistance
														
 
															-// OpDecorate %type_gl_PerVertex Block
														
 
															 // %void = OpTypeVoid
														
 
															 // %3 = OpTypeFunction %void
														
 
															-// %float = OpTypeFloat 32
														
 
															-// %v4float = OpTypeVector %float 4
														
 
															-// %uint = OpTypeInt 32 0
														
 
															-// %uint_1 = OpConstant %uint 1
														
 
															-// %_arr_float_uint_1 = OpTypeArray %float %uint_1
														
 
															-// %type_gl_PerVertex = OpTypeStruct %v4float %float %_arr_float_uint_1 %_arr_float_uint_1
														
 
															-// %_ptr_Output_type_gl_PerVertex = OpTypePointer Output %type_gl_PerVertex
														
 
															 // %VSIn = OpTypeStruct
														
 
															 // %_ptr_Function_VSIn = OpTypePointer Function %VSIn
														
 
															-// %19 = OpTypeFunction %VSIn %_ptr_Function_VSIn
														
 
															-// %gl_PerVertexOut = OpVariable %_ptr_Output_type_gl_PerVertex Output
														
 
															+// %11 = OpTypeFunction %VSIn %_ptr_Function_VSIn
														
 
															 // %main = OpFunction %void None %3
														
 
															-// %13 = OpLabel
														
 
															+// %5 = OpLabel
														
 
															 // %param_var_input = OpVariable %_ptr_Function_VSIn Function
														
 
															-// %17 = OpCompositeConstruct %VSIn
														
 
															-// OpStore %param_var_input %17
														
 
															-// %18 = OpFunctionCall %VSIn %src_main %param_var_input
														
 
															+// %9 = OpCompositeConstruct %VSIn
														
 
															+// OpStore %param_var_input %9
														
 
															+// %10 = OpFunctionCall %VSIn %src_main %param_var_input
														
 
															 // OpReturn
														
 
															 // OpFunctionEnd
														
 
															-// %src_main = OpFunction %VSIn None %19
														
 
															+// %src_main = OpFunction %VSIn None %11
														
 
															 // %input = OpFunctionParameter %_ptr_Function_VSIn
														
 
															 // %bb_entry = OpLabel
														
 
															 // %result = OpVariable %_ptr_Function_VSIn Function
														
 
															-// %23 = OpLoad %VSIn %result
														
 
															-// OpReturnValue %23
														
 
															-// OpFunctionEnd
														
 
															+// %15 = OpLoad %VSIn %result
														
 
															+// OpReturnValue %15
														
 
															+// OpFunctionEnd
														
--- a/tools/clang/test/CodeGenSPIRV/fn.param.inout.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/fn.param.inout.hlsl
@@ -11,36 +11,18 @@ float fnInOut(uniform float a, in float b, out float c, inout float d, inout Pix
 
															 }
														
 
															 float main(float val: A) : B {
														
 
															-// CHECK-LABEL: %src_main = OpFunction
														
 
															     float m, n;
														
 
															     Pixel p;
														
 
															 // CHECK:      %param_var_a = OpVariable %_ptr_Function_float Function
														
 
															 // CHECK-NEXT: %param_var_b = OpVariable %_ptr_Function_float Function
														
 
															-// CHECK-NEXT: %param_var_c = OpVariable %_ptr_Function_float Function
														
 
															-// CHECK-NEXT: %param_var_d = OpVariable %_ptr_Function_float Function
														
 
															-// CHECK-NEXT: %param_var_e = OpVariable %_ptr_Function_Pixel Function
														
 
															 // CHECK-NEXT:                OpStore %param_var_a %float_5
														
 
															 // CHECK-NEXT: [[val:%\d+]] = OpLoad %float %val
														
 
															 // CHECK-NEXT:                OpStore %param_var_b [[val]]
														
 
															-// CHECK-NEXT:   [[m:%\d+]] = OpLoad %float %m
														
 
															-// CHECK-NEXT:                OpStore %param_var_c [[m]]
														
 
															-// CHECK-NEXT:   [[n:%\d+]] = OpLoad %float %n
														
 
															-// CHECK-NEXT:                OpStore %param_var_d [[n]]
														
 
															-// CHECK-NEXT:   [[p:%\d+]] = OpLoad %Pixel %p
														
 
															-// CHECK-NEXT:                OpStore %param_var_e [[p]]
														
 
															-// CHECK-NEXT: [[ret:%\d+]] = OpFunctionCall %float %fnInOut %param_var_a %param_var_b %param_var_c %param_var_d
														
 
															-
														
 
															-// CHECK-NEXT:   [[c:%\d+]] = OpLoad %float %param_var_c
														
 
															-// CHECK-NEXT:                OpStore %m [[c]]
														
 
															-// CHECK-NEXT:   [[d:%\d+]] = OpLoad %float %param_var_d
														
 
															-// CHECK-NEXT:                OpStore %n [[d]]
														
 
															-// CHECK-NEXT:   [[e:%\d+]] = OpLoad %Pixel %param_var_e
														
 
															-// CHECK-NEXT:                OpStore %p [[e]]
														
 
															+// CHECK-NEXT: [[ret:%\d+]] = OpFunctionCall %float %fnInOut %param_var_a %param_var_b %m %n %p
														
 
															 // CHECK-NEXT:                OpReturnValue [[ret]]
														
 
															     return fnInOut(5., val, m, n, p);
														
 
															-// CHECK-NEXT: OpFunctionEnd
														
 
															 }
														
--- a/tools/clang/test/CodeGenSPIRV/fn.param.inout.no-copy.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/fn.param.inout.no-copy.hlsl
@@ -0,0 +1,37 @@
 
															+// Run: %dxc -T vs_6_0 -E main
														
 
															+
														
 
															+struct S {
														
 
															+    float4 val;
														
 
															+};
														
 
															+
														
 
															+void foo(
														
 
															+    out   int      a,
														
 
															+    inout uint2    b,
														
 
															+    out   float2x3 c,
														
 
															+    inout S        d,
														
 
															+    out   float    e[4]
														
 
															+) {
														
 
															+    a = 0;
														
 
															+    b = 1;
														
 
															+    c = 2.0;
														
 
															+    d.val = 3.0;
														
 
															+    e[0] = 4.0;
														
 
															+}
														
 
															+
														
 
															+void main() {
														
 
															+    int      a;
														
 
															+    uint2    b;
														
 
															+    float2x3 c;
														
 
															+    S        d;
														
 
															+    float    e[4];
														
 
															+
														
 
															+// CHECK: %a = OpVariable %_ptr_Function_int Function
														
 
															+// CHECK: %b = OpVariable %_ptr_Function_v2uint Function
														
 
															+// CHECK: %c = OpVariable %_ptr_Function_mat2v3float Function
														
 
															+// CHECK: %d = OpVariable %_ptr_Function_S Function
														
 
															+// CHECK: %e = OpVariable %_ptr_Function__arr_float_uint_4 Function
														
 
															+
														
 
															+// CHECK:      OpFunctionCall %void %foo %a %b %c %d %e
														
 
															+
														
 
															+    foo(a, b, c, d, e);
														
 
															+}
														
--- a/tools/clang/test/CodeGenSPIRV/fn.param.inout.storage-class.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/fn.param.inout.storage-class.hlsl
@@ -0,0 +1,30 @@
 
															+// Run: %dxc -T vs_6_0 -E main
														
 
															+
														
 
															+RWStructuredBuffer<float> Data;
														
 
															+
														
 
															+void foo(in float a, inout float b, out float c) {
														
 
															+    b += a;
														
 
															+    c = a + b;
														
 
															+}
														
 
															+
														
 
															+void main(float input : INPUT) {
														
 
															+// CHECK: %param_var_a = OpVariable %_ptr_Function_float Function
														
 
															+// CHECK: %param_var_b = OpVariable %_ptr_Function_float Function
														
 
															+// CHECK: %param_var_c = OpVariable %_ptr_Function_float Function
														
 
															+
														
 
															+// CHECK: [[val:%\d+]] = OpLoad %float %input
														
 
															+// CHECK:                OpStore %param_var_a [[val]]
														
 
															+// CHECK:  [[p0:%\d+]] = OpAccessChain %_ptr_Uniform_float %Data %int_0 %uint_0
														
 
															+// CHECK: [[val:%\d+]] = OpLoad %float [[p0]]
														
 
															+// CHECK:                OpStore %param_var_b [[val]]
														
 
															+// CHECK:  [[p1:%\d+]] = OpAccessChain %_ptr_Uniform_float %Data %int_0 %uint_1
														
 
															+// CHECK: [[val:%\d+]] = OpLoad %float [[p1]]
														
 
															+// CHECK:                OpStore %param_var_c [[val]]
														
 
															+
														
 
															+// CHECK:                OpFunctionCall %void %foo %param_var_a %param_var_b %param_var_c
														
 
															+    foo(input, Data[0], Data[1]);
														
 
															+// CHECK: [[val:%\d+]] = OpLoad %float %param_var_b
														
 
															+// CHECK:                OpStore [[p0]] [[val]]
														
 
															+// CHECK: [[val:%\d+]] = OpLoad %float %param_var_c
														
 
															+// CHECK:                OpStore [[p1]] [[val]]
														
 
															+}
														
--- a/tools/clang/test/CodeGenSPIRV/fn.param.inout.vector.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/fn.param.inout.vector.hlsl
@@ -13,14 +13,12 @@ float4 main() : C {
 
															 // CHECK-NEXT:                OpImageWrite [[buf]] %uint_5 [[a]]
														
 
															 // CHECK-NEXT:   [[b:%\d+]] = OpLoad %v3float %param_var_b
														
 
															 // CHECK-NEXT: [[tex:%\d+]] = OpLoad %type_2d_image %MyRWTexture
														
 
															-// CHECK-NEXT:                OpImageWrite [[tex]] %36 [[b]]
														
 
															+// CHECK-NEXT:                OpImageWrite [[tex]] {{%\d+}} [[b]]
														
 
															     foo(MyRWBuffer[5], MyRWTexture[uint2(6, 7)]);
														
 
															     float4 val;
														
 
															 // CHECK:    [[z_ptr:%\d+]] = OpAccessChain %_ptr_Function_float %val %int_2
														
 
															-// CHECK:          {{%\d+}} = OpFunctionCall %void %bar %param_var_x %param_var_y %param_var_z %param_var_w
														
 
															-// CHECK-NEXT:   [[x:%\d+]] = OpLoad %v4float %param_var_x
														
 
															-// CHECK-NEXT:                OpStore %val [[x]]
														
 
															+// CHECK:          {{%\d+}} = OpFunctionCall %void %bar %val %param_var_y %param_var_z %param_var_w
														
 
															 // CHECK-NEXT:   [[y:%\d+]] = OpLoad %v3float %param_var_y
														
 
															 // CHECK-NEXT: [[old:%\d+]] = OpLoad %v4float %val
														
 
															     // Write to val.zwx:
														
--- a/tools/clang/test/CodeGenSPIRV/gs.emit.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/gs.emit.hlsl
@@ -28,7 +28,7 @@ void main(in    line float2 foo[2] : FOO,
 
															 // Write back to stage output variables
														
 
															 // CHECK-NEXT: [[vertex:%\d+]] = OpLoad %GsPerVertexOut %vertex
														
 
															 // CHECK-NEXT:    [[pos:%\d+]] = OpCompositeExtract %v4float [[vertex]] 0
														
 
															-// CHECK-NEXT:                   OpStore %gl_Position [[pos]]
														
 
															+// CHECK-NEXT:                   OpStore %gl_Position_0 [[pos]]
														
 
															 // CHECK-NEXT:    [[foo:%\d+]] = OpCompositeExtract %v3float [[vertex]] 1
														
 
															 // CHECK-NEXT:                   OpStore %out_var_FOO [[foo]]
														
 
															 // CHECK-NEXT:      [[s:%\d+]] = OpCompositeExtract %GsInnerOut [[vertex]] 2
														
@@ -41,7 +41,7 @@ void main(in    line float2 foo[2] : FOO,
 
															 // Write back to stage output variables
														
 
															 // CHECK-NEXT: [[vertex:%\d+]] = OpLoad %GsPerVertexOut %vertex
														
 
															 // CHECK-NEXT:    [[pos:%\d+]] = OpCompositeExtract %v4float [[vertex]] 0
														
 
															-// CHECK-NEXT:                   OpStore %gl_Position [[pos]]
														
 
															+// CHECK-NEXT:                   OpStore %gl_Position_0 [[pos]]
														
 
															 // CHECK-NEXT:    [[foo:%\d+]] = OpCompositeExtract %v3float [[vertex]] 1
														
 
															 // CHECK-NEXT:                   OpStore %out_var_FOO [[foo]]
														
 
															 // CHECK-NEXT:      [[s:%\d+]] = OpCompositeExtract %GsInnerOut [[vertex]] 2
														
--- a/tools/clang/test/CodeGenSPIRV/hs.structure.hlsl
+++ b/tools/clang/test/CodeGenSPIRV/hs.structure.hlsl
@@ -12,7 +12,7 @@
 
															 // CHECK:      {{%\d+}} = OpFunctionCall %BEZIER_CONTROL_POINT %src_main %param_var_ip %param_var_i %param_var_PatchID
														
 
															-// CHECK:                 OpControlBarrier %uint_2 %uint_1 %uint_0
														
 
															+// CHECK:                 OpControlBarrier %uint_2 %uint_4 %uint_0
														
 
															 // CHECK: [[cond:%\d+]] = OpIEqual %bool [[id]] %uint_0
														
 
															 // CHECK:                 OpSelectionMerge %if_merge None
	`@@ -1 +1 @@`
	`-Subproject commit 3a4dbdde9a9b2cf23736694ba70262dce27fbeaa`
			`+Subproject commit 3ce3e49d73b8abbf2ffe33f829f941fb2a40f552`
	`@@ -1 +1 @@`
	`-Subproject commit 42840d15e4bf5cba4a7345639b409c6e962b96c2`
			`+Subproject commit b09e3ce8427c7cfffcc4950f5bd05fa4c586b23c`
	`@@ -1 +1 @@`
	`-Subproject commit 82febb8eafc0425601b0d46567dc66c7750233ff`
			`+Subproject commit 08d5b1f33af8c18785fb8ca02792b5fac81e248f`
	`@@ -1 +1 @@`
	`-Subproject commit f2cc1aeb5de463c45d020c446cbcb028385b49f3`
			`+Subproject commit 1c7eb5604bc46c0198fc7bc35b32985ffe57ca93`