8 years ago · ae69cf0a58
--- a/include/dxc/HLSL/DxilOperations.h
+++ b/include/dxc/HLSL/DxilOperations.h
@@ -21,6 +21,7 @@ class Value;
 
															 class Instruction;
														
 
															 };
														
 
															 #include "llvm/IR/Attributes.h"
														
 
															+#include "llvm/ADT/StringRef.h"
														
 
															 #include "DxilConstants.h"
														
 
															 #include <unordered_map>
														
@@ -72,6 +73,7 @@ public:
 
															   static const char *GetOpCodeClassName(OpCode OpCode);
														
 
															   static bool IsOverloadLegal(OpCode OpCode, llvm::Type *pType);
														
 
															   static bool CheckOpCodeTable();
														
 
															+  static bool IsDxilOpFuncName(llvm::StringRef name);
														
 
															   static bool IsDxilOpFunc(const llvm::Function *F);
														
 
															   static bool IsDxilOpFuncCallInst(const llvm::Instruction *I);
														
 
															   static bool IsDxilOpFuncCallInst(const llvm::Instruction *I, OpCode opcode);
														
--- a/include/llvm/Analysis/ConstantFolding.h
+++ b/include/llvm/Analysis/ConstantFolding.h
@@ -22,6 +22,7 @@
 
															 namespace llvm {
														
 
															   class Constant;
														
 
															+  class ConstantFP;
														
 
															   class ConstantExpr;
														
 
															   class Instruction;
														
 
															   class DataLayout;
														
@@ -108,6 +109,11 @@ bool canConstantFoldCallTo(const Function *F);
 
															 /// with the specified arguments, returning null if unsuccessful.
														
 
															 Constant *ConstantFoldCall(Function *F, ArrayRef<Constant *> Operands,
														
 
															                            const TargetLibraryInfo *TLI = nullptr);
														
 
															+
														
 
															+/// HLSL Change - make these functions external so we can call them from 
														
 
															+/// DxilConstantFolding.cpp.
														
 
															+Constant *ConstantFoldFP(double(__cdecl *NativeFP)(double), double V, Type *Ty);
														
 
															+double getValueAsDouble(ConstantFP *Op);
														
 
															 }
														
 
															 #endif
														
--- a/include/llvm/Analysis/DxilConstantFolding.h
+++ b/include/llvm/Analysis/DxilConstantFolding.h
@@ -0,0 +1,41 @@
 
															+//===-- DxilConstantFolding.h - Constant folding for Dxil ------*- C++ -*-===//
														
 
															+//
														
 
															+//                     The LLVM Compiler Infrastructure
														
 
															+//
														
 
															+// This file is distributed under the University of Illinois Open Source
														
 
															+// License. See LICENSE.TXT for details.
														
 
															+//
														
 
															+// Copyright (C) Microsoft Corporation. All rights reserved.
														
 
															+//===----------------------------------------------------------------------===//
														
 
															+//
														
 
															+// This file declares routines for folding dxil intrinsics into constants when
														
 
															+// all operands are constants.
														
 
															+//
														
 
															+// We hook into the LLVM routines for constant folding so the function
														
 
															+// interfaces are dictated by what llvm provides.
														
 
															+//
														
 
															+//===----------------------------------------------------------------------===//
														
 
															+
														
 
															+#ifndef LLVM_ANALYSIS_HLSLCONSTANTFOLDING_H
														
 
															+#define LLVM_ANALYSIS_HLSLCONSTANTFOLDING_H
														
 
															+#include "llvm/ADT/StringRef.h"
														
 
															+
														
 
															+namespace llvm {
														
 
															+  class Constant;
														
 
															+  class Function;
														
 
															+  class Type;
														
 
															+  template<typename T>
														
 
															+  class ArrayRef;
														
 
															+}
														
 
															+
														
 
															+namespace hlsl {
														
 
															+  /// ConstantFoldScalarCall - Try to constant fold the call instruction.
														
 
															+  /// If successful, the constant result is returned, if not, null is returned.
														
 
															+  llvm::Constant *ConstantFoldScalarCall(llvm::StringRef Name, llvm::Type *Ty, llvm::ArrayRef<llvm::Constant *> Operands);
														
 
															+
														
 
															+  /// CanConstantFoldCallTo - Return true if we can potentially constant
														
 
															+  /// fold a call to the given function.
														
 
															+  bool CanConstantFoldCallTo(const llvm::Function *F);
														
 
															+}
														
 
															+
														
 
															+#endif
														
--- a/lib/Analysis/CMakeLists.txt
+++ b/lib/Analysis/CMakeLists.txt
@@ -25,6 +25,7 @@ add_llvm_library(LLVMAnalysis
 
															   DivergenceAnalysis.cpp
														
 
															   DomPrinter.cpp
														
 
															   DominanceFrontier.cpp
														
 
															+  DxilConstantFolding.cpp
														
 
															   IVUsers.cpp
														
 
															   InstCount.cpp
														
 
															   InstructionSimplify.cpp
														
--- a/lib/Analysis/ConstantFolding.cpp
+++ b/lib/Analysis/ConstantFolding.cpp
@@ -37,6 +37,8 @@
 
															 #include <cerrno>
														
 
															 #include <cmath>
														
 
															+#include "llvm/Analysis/DxilConstantFolding.h" // HLSL Change
														
 
															+
														
 
															 #ifdef HAVE_FENV_H
														
 
															 #include <fenv.h>
														
 
															 #endif
														
@@ -1222,6 +1224,9 @@ Constant *llvm::ConstantFoldLoadThroughGEPIndices(Constant *C,
 
															 /// Return true if it's even possible to fold a call to the specified function.
														
 
															 bool llvm::canConstantFoldCallTo(const Function *F) {
														
 
															+  if (hlsl::CanConstantFoldCallTo(F)) // HLSL Change
														
 
															+    return true;
														
 
															+
														
 
															   switch (F->getIntrinsicID()) {
														
 
															   case Intrinsic::fabs:
														
 
															   case Intrinsic::minnum:
														
@@ -1336,8 +1341,8 @@ static inline bool llvm_fenv_testexcept() {
 
															 }
														
 
															 } // End namespace
														
 
															-// HLSL Change: changed calling convention of NativeFP to __cdecl
														
 
															-static Constant *ConstantFoldFP(double (__cdecl *NativeFP)(double), double V,
														
 
															+// HLSL Change: changed calling convention of NativeFP to __cdecl and make non-static
														
 
															+Constant *llvm::ConstantFoldFP(double (__cdecl *NativeFP)(double), double V,
														
 
															                                 Type *Ty) {
														
 
															   llvm_fenv_clearexcept();
														
 
															   V = NativeFP(V);
														
@@ -1388,7 +1393,8 @@ static Constant *ConstantFoldConvertToInt(const APFloat &Val,
 
															   return ConstantInt::get(Ty, UIntVal, /*isSigned=*/true);
														
 
															 }
														
 
															-static double getValueAsDouble(ConstantFP *Op) {
														
 
															+// HLSL Change - make non-static.
														
 
															+double llvm::getValueAsDouble(ConstantFP *Op) {
														
 
															   Type *Ty = Op->getType();
														
 
															   if (Ty->isFloatTy())
														
@@ -1406,6 +1412,9 @@ static double getValueAsDouble(ConstantFP *Op) {
 
															 static Constant *ConstantFoldScalarCall(StringRef Name, unsigned IntrinsicID,
														
 
															                                         Type *Ty, ArrayRef<Constant *> Operands,
														
 
															                                         const TargetLibraryInfo *TLI) {
														
 
															+  if (Constant *C = hlsl::ConstantFoldScalarCall(Name, Ty, Operands)) // HLSL Change - Try hlsl constant folding first.
														
 
															+    return C;
														
 
															+
														
 
															   if (Operands.size() == 1) {
														
 
															     if (ConstantFP *Op = dyn_cast<ConstantFP>(Operands[0])) {
														
 
															       if (IntrinsicID == Intrinsic::convert_to_fp16) {
														
--- a/lib/Analysis/DxilConstantFolding.cpp
+++ b/lib/Analysis/DxilConstantFolding.cpp
@@ -0,0 +1,553 @@
 
															+//===-- DxilConstantFolding.cpp - Fold dxil intrinsics into constants -----===//
														
 
															+//
														
 
															+//                     The LLVM Compiler Infrastructure
														
 
															+//
														
 
															+// This file is distributed under the University of Illinois Open Source
														
 
															+// License. See LICENSE.TXT for details.
														
 
															+//
														
 
															+// Copyright (C) Microsoft Corporation. All rights reserved.
														
 
															+//
														
 
															+//===----------------------------------------------------------------------===//
														
 
															+//
														
 
															+//
														
 
															+//===----------------------------------------------------------------------===//
														
 
															+#include "llvm/Analysis/DxilConstantFolding.h"
														
 
															+#include "llvm/Analysis/ConstantFolding.h"
														
 
															+#include "llvm/ADT/SmallPtrSet.h"
														
 
															+#include "llvm/ADT/SmallVector.h"
														
 
															+#include "llvm/ADT/StringMap.h"
														
 
															+#include "llvm/Analysis/TargetLibraryInfo.h"
														
 
															+#include "llvm/Analysis/ValueTracking.h"
														
 
															+#include "llvm/Config/config.h"
														
 
															+#include "llvm/IR/Constants.h"
														
 
															+#include "llvm/IR/DataLayout.h"
														
 
															+#include "llvm/IR/DerivedTypes.h"
														
 
															+#include "llvm/IR/Function.h"
														
 
															+#include "llvm/IR/GetElementPtrTypeIterator.h"
														
 
															+#include "llvm/IR/GlobalVariable.h"
														
 
															+#include "llvm/IR/Instructions.h"
														
 
															+#include "llvm/IR/Intrinsics.h"
														
 
															+#include "llvm/IR/Operator.h"
														
 
															+#include "llvm/Support/ErrorHandling.h"
														
 
															+#include "llvm/Support/MathExtras.h"
														
 
															+#include <cerrno>
														
 
															+#include <cmath>
														
 
															+#include <algorithm>
														
 
															+#include <functional>
														
 
															+
														
 
															+#include "dxc/HLSL/Dxil.h"
														
 
															+
														
 
															+using namespace llvm;
														
 
															+using namespace hlsl;
														
 
															+
														
 
															+// Decide whether a call targets a dxil intrinsic and, if so, recover the
															+// opcode of the intrinsic from the call's first operand.
															+//
															+// Returns true and stores the opcode in `out` only when Name is a dxil op
															+// function name, Operands is non-empty, and Operands[0] is a ConstantInt
															+// whose value is below OP::OpCode::NumOpCodes. In every other case the
															+// function returns false and leaves `out` unmodified.
															+static bool GetDxilOpcode(StringRef Name, ArrayRef<Constant *> Operands, OP::OpCode &out) {
															+  if (!OP::IsDxilOpFuncName(Name) || Operands.empty())
															+    return false;
															+
															+  ConstantInt *OpcodeArg = dyn_cast<ConstantInt>(Operands[0]);
															+  if (!OpcodeArg)
															+    return false;
															+
															+  // Reject values that do not name a known opcode.
															+  const uint64_t RawOpcode = OpcodeArg->getLimitedValue();
															+  if (RawOpcode >= static_cast<uint64_t>(OP::OpCode::NumOpCodes))
															+    return false;
															+
															+  out = static_cast<OP::OpCode>(RawOpcode);
															+  return true;
															+}
														
 
															+
														
 
															+// Callable types used to evaluate float constants:
															+//  - NativeFPUnaryOp: plain __cdecl function pointer operating on host doubles.
															+//  - APFloatUnaryOp:  in-place operation on an APFloat that reports its status.
															+using NativeFPUnaryOp = double(__cdecl *)(double);
															+using APFloatUnaryOp = std::function<APFloat::opStatus(APFloat &)>;
														
 
															+
														
 
															+/// Fold a unary floating point operation using a host native double routine.
															+///
															+/// APFloat implementations of these functions do not exist yet, so the
															+/// constant is widened to double, evaluated natively, and converted back to
															+/// Ty. Float variants are never called directly; this relies on
															+/// (float)(f((double)arg)) == f(arg) holding for every function passed in.
															+/// Long double is not supported yet.
															+///
															+/// The actual folding is delegated to llvm::ConstantFoldFP.
															+static Constant *DxilConstantFoldFP(NativeFPUnaryOp NativeFP, ConstantFP *C, Type *Ty) {
															+  return llvm::ConstantFoldFP(NativeFP, llvm::getValueAsDouble(C), Ty);
															+}
														
 
															+
														
 
															+// Apply an in-place APFloat operation to a copy of C's value and wrap the
															+// result in a new constant. Folding is abandoned (nullptr) unless the
															+// operation reports opOK.
															+static Constant *HLSLConstantFoldAPFloat(APFloatUnaryOp NativeFP, ConstantFP *C, Type *Ty) {
															+  APFloat Value = C->getValueAPF();
															+  const APFloat::opStatus Status = NativeFP(Value);
															+
															+  if (Status == APFloat::opStatus::opOK)
															+    return ConstantFP::get(Ty->getContext(), Value);
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Fold a dxil round intrinsic by rounding C to an integral value with the
															+// requested rounding mode.
															+static Constant *HLSLConstantFoldRound(APFloat::roundingMode roundingMode, ConstantFP *C, Type *Ty) {
															+  return HLSLConstantFoldAPFloat(
															+      [roundingMode](APFloat &Value) { return Value.roundToIntegral(roundingMode); },
															+      C, Ty);
															+}
														
 
															+
														
 
															+namespace {
															+// View over the operands of a dxil intrinsic call that hides the leading
															+// opcode operand: index 0 of this wrapper is raw operand 1, and so on.
															+// The typed accessors dyn_cast the operand, so they yield null when the
															+// operand is not of the requested constant kind.
															+//
															+// No bounds checking is done here, and Size() subtracts one from an
															+// unsigned count, so the wrapped list must hold at least the opcode.
															+class DxilIntrinsicOperands {
															+public:
															+  DxilIntrinsicOperands(ArrayRef<Constant *> RawCallOperands)
															+      : m_RawCallOperands(RawCallOperands) {}
															+
															+  // Number of operands that follow the opcode.
															+  size_t Size() const { return m_RawCallOperands.size() - 1; }
															+
															+  // Operand at `index`, counted from the first operand after the opcode.
															+  Constant * const &operator[](size_t index) const {
															+    return m_RawCallOperands[index + 1];
															+  }
															+
															+  // Operand at `index` as a ConstantInt, or null if it is not one.
															+  ConstantInt *GetConstantInt(size_t index) const {
															+    return dyn_cast<ConstantInt>((*this)[index]);
															+  }
															+
															+  // Operand at `index` as a ConstantFP, or null if it is not one.
															+  ConstantFP *GetConstantFloat(size_t index) const {
															+    return dyn_cast<ConstantFP>((*this)[index]);
															+  }
															+
															+private:
															+  ArrayRef<Constant *> m_RawCallOperands;
															+};
															+} // namespace
														
 
															+
														
 
															+/// True when C is neither NaN nor an infinity.
															+///
															+/// Only functions with finite arguments are folded. Folding NaN and inf is
															+/// likely to be aborted with an exception anyway, and some host libms have
															+/// known errors raising exceptions.
															+static bool IsFinite(ConstantFP *C) {
															+  const APFloat &Value = C->getValueAPF();
															+  return !(Value.isNaN() || Value.isInfinity());
															+}
														
 
															+
														
 
															+// An operand is foldable when it is present (non-null) and finite.
															+static bool IsValidOp(ConstantFP *C) {
															+  return C && IsFinite(C);
															+}
														
 
															+
														
 
															+// True when every operand in Ops passes IsValidOp (vacuously true for an
															+// empty list).
															+static bool AllValidOps(ArrayRef<ConstantFP *> Ops) {
															+  for (ConstantFP *Op : Ops) {
															+    if (!IsValidOp(Op))
															+      return false;
															+  }
															+  return true;
															+}
														
 
															+
														
 
															+// Constant fold unary floating point dxil intrinsics.
															+//
															+// Most opcodes are evaluated with the host's double precision math routines
															+// through DxilConstantFoldFP; the Round_* opcodes are evaluated directly on
															+// the APFloat through HLSLConstantFoldRound.
															+//
															+// Returns the folded constant, or nullptr when the opcode is not handled
															+// here or the folding helper itself returns null.
															+static Constant *ConstantFoldUnaryFPIntrinsic(OP::OpCode opcode, Type *Ty, ConstantFP *Op) {
															+  switch (opcode) {
															+  default: break;
															+  case OP::OpCode::FAbs: return DxilConstantFoldFP(fabs, Op, Ty);
															+  case OP::OpCode::Saturate: {
															+    // Clamp to the [0, 1] range.
															+    NativeFPUnaryOp f = [](double x) { return std::max(std::min(x, 1.0), 0.0); };
															+    return DxilConstantFoldFP(f, Op, Ty);
															+  }
															+  case OP::OpCode::Cos:  return DxilConstantFoldFP(cos, Op, Ty);
															+  case OP::OpCode::Sin:  return DxilConstantFoldFP(sin, Op, Ty);
															+  case OP::OpCode::Tan:  return DxilConstantFoldFP(tan, Op, Ty);
															+  case OP::OpCode::Acos: return DxilConstantFoldFP(acos, Op, Ty);
															+  case OP::OpCode::Asin: return DxilConstantFoldFP(asin, Op, Ty);
															+  case OP::OpCode::Atan: return DxilConstantFoldFP(atan, Op, Ty);
															+  case OP::OpCode::Hcos: return DxilConstantFoldFP(cosh, Op, Ty);
															+  case OP::OpCode::Hsin: return DxilConstantFoldFP(sinh, Op, Ty);
															+  case OP::OpCode::Htan: return DxilConstantFoldFP(tanh, Op, Ty);
															+  // Exp and Log are folded with the base-2 routines.
															+  case OP::OpCode::Exp:  return DxilConstantFoldFP(exp2, Op, Ty);
															+  case OP::OpCode::Frc: {
															+    // frc is defined as x - round_ni(x), i.e. x - floor(x), so the result
															+    // is non-negative for negative inputs as well: frc(-0.25) == 0.75.
															+    // The absolute value of the truncated fractional part would give 0.25
															+    // for that input, which does not match the instruction.
															+    NativeFPUnaryOp f = [](double x) { return x - floor(x); };
															+    return DxilConstantFoldFP(f, Op, Ty);
															+  }
															+  case OP::OpCode::Log: return DxilConstantFoldFP(log2, Op, Ty);
															+  case OP::OpCode::Sqrt: return DxilConstantFoldFP(sqrt, Op, Ty);
															+  case OP::OpCode::Rsqrt: {
															+    // Reciprocal square root.
															+    NativeFPUnaryOp f = [](double x) { return 1.0 / sqrt(x); };
															+    return DxilConstantFoldFP(f, Op, Ty);
															+  }
															+  // Round to nearest-even, toward -inf, toward +inf and toward zero.
															+  case OP::OpCode::Round_ne: return HLSLConstantFoldRound(APFloat::roundingMode::rmNearestTiesToEven, Op, Ty);
															+  case OP::OpCode::Round_ni: return HLSLConstantFoldRound(APFloat::roundingMode::rmTowardNegative, Op, Ty);
															+  case OP::OpCode::Round_pi: return HLSLConstantFoldRound(APFloat::roundingMode::rmTowardPositive, Op, Ty);
															+  case OP::OpCode::Round_z: return HLSLConstantFoldRound(APFloat::roundingMode::rmTowardZero, Op, Ty);
															+  }
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Constant fold binary floating point dxil intrinsics (FMax and FMin).
															+// Returns nullptr for any other opcode.
															+static Constant *ConstantFoldBinaryFPIntrinsic(OP::OpCode opcode, Type *Ty, ConstantFP *Op1, ConstantFP *Op2) {
															+  const APFloat &Lhs = Op1->getValueAPF();
															+  const APFloat &Rhs = Op2->getValueAPF();
															+
															+  if (opcode == OP::OpCode::FMax)
															+    return ConstantFP::get(Ty->getContext(), maxnum(Lhs, Rhs));
															+
															+  if (opcode == OP::OpCode::FMin)
															+    return ConstantFP::get(Ty->getContext(), minnum(Lhs, Rhs));
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Constant fold ternary floating point dxil intrinsics.
															+//
															+// FMad is evaluated as a multiply followed by an add (two roundings), Fma
															+// as a single fused multiply-add; both round to nearest, ties to even.
															+// Returns nullptr for any other opcode.
															+static Constant *ConstantFoldTernaryFPIntrinsic(OP::OpCode opcode, Type *Ty, ConstantFP *Op1, ConstantFP *Op2, ConstantFP *Op3) {
															+  const APFloat::roundingMode Rounding = APFloat::rmNearestTiesToEven;
															+  const APFloat &Multiplier = Op2->getValueAPF();
															+  const APFloat &Addend = Op3->getValueAPF();
															+
															+  if (opcode == OP::OpCode::FMad) {
															+    APFloat Acc(Op1->getValueAPF());
															+    Acc.multiply(Multiplier, Rounding);
															+    Acc.add(Addend, Rounding);
															+    return ConstantFP::get(Ty->getContext(), Acc);
															+  }
															+
															+  if (opcode == OP::OpCode::Fma) {
															+    APFloat Acc(Op1->getValueAPF());
															+    Acc.fusedMultiplyAdd(Multiplier, Addend, Rounding);
															+    return ConstantFP::get(Ty->getContext(), Acc);
															+  }
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Compute the dot product of two equally sized, non-empty vectors of
															+// floating point constants.
															+//
															+// Each product and each accumulation step is rounded to nearest, ties to
															+// even, in the semantics of the first element of A. Returns nullptr when
															+// the sizes are inconsistent (asserting in debug builds) or when any
															+// operand is null or non-finite.
															+static Constant *ComputeDot(Type *Ty, ArrayRef<ConstantFP *> A, ArrayRef<ConstantFP *> B) {
															+  const size_t Count = A.size();
															+  if (Count == 0 || Count != B.size()) {
															+    assert(false && "invalid call to compute dot");
															+    return nullptr;
															+  }
															+
															+  if (!(AllValidOps(A) && AllValidOps(B)))
															+    return nullptr;
															+
															+  const APFloat::roundingMode Rounding = APFloat::roundingMode::rmNearestTiesToEven;
															+  APFloat Acc = APFloat::getZero(A[0]->getValueAPF().getSemantics());
															+  for (size_t Idx = 0; Idx < Count; ++Idx) {
															+    APFloat Product(A[Idx]->getValueAPF());
															+    Product.multiply(B[Idx]->getValueAPF(), Rounding);
															+    Acc.add(Product, Rounding);
															+  }
															+
															+  return ConstantFP::get(Ty->getContext(), Acc);
															+}
														
 
															+
														
 
															+// Constant folding for dot2, dot3, and dot4.
															+//
															+// The operands (after the opcode) hold all components of the first vector
															+// followed by all components of the second one. Operands that are not
															+// floating point constants come back as null from GetConstantFloat and
															+// make ComputeDot decline to fold. Returns nullptr for any other opcode.
															+static Constant *ConstantFoldDot(OP::OpCode opcode, Type *Ty, const DxilIntrinsicOperands &operands) {
															+  unsigned Dim = 0;
															+  switch (opcode) {
															+  case OP::OpCode::Dot2: Dim = 2; break;
															+  case OP::OpCode::Dot3: Dim = 3; break;
															+  case OP::OpCode::Dot4: Dim = 4; break;
															+  default: return nullptr;
															+  }
															+
															+  SmallVector<ConstantFP *, 4> VecA;
															+  SmallVector<ConstantFP *, 4> VecB;
															+  for (unsigned Idx = 0; Idx < Dim; ++Idx) {
															+    VecA.push_back(operands.GetConstantFloat(Idx));
															+    VecB.push_back(operands.GetConstantFloat(Dim + Idx));
															+  }
															+
															+  return ComputeDot(Ty, VecA, VecB);
															+}
														
 
															+
														
 
															+// Constant fold a Bfrev dxil intrinsic: reverse the bits of C within the
															+// width of Ty. Only 16, 32 and 64 bit integer types are handled; any other
															+// type yields nullptr.
															+static Constant *HLSLConstantFoldBfrev(ConstantInt *C, Type *Ty) {
															+  const uint64_t Raw = C->getValue().getLimitedValue();
															+
															+  // The value is narrowed to the result width first so that reverseBits
															+  // operates on exactly that many bits.
															+  uint64_t Reversed = 0;
															+  if (Ty->isIntegerTy(32))
															+    Reversed = llvm::reverseBits(static_cast<uint32_t>(Raw));
															+  else if (Ty->isIntegerTy(16))
															+    Reversed = llvm::reverseBits(static_cast<uint16_t>(Raw));
															+  else if (Ty->isIntegerTy(64))
															+    Reversed = llvm::reverseBits(static_cast<uint64_t>(Raw));
															+  else
															+    return nullptr;
															+
															+  return ConstantInt::get(Ty, Reversed);
															+}
														
 
															+
														
 
															+// Build the result of a findfirst* bit function.
															+// A position equal to the bitwidth means no bit was found; in that case
															+// the result is -1 (all ones in Ty). Otherwise the position is returned.
															+static Constant *HLSLConstantFoldFindBit(Type *Ty, unsigned position, unsigned bitwidth) {
															+  if (position != bitwidth)
															+    return ConstantInt::get(Ty, position);
															+
															+  return ConstantInt::get(Ty, APInt::getAllOnesValue(Ty->getScalarSizeInBits()));
															+}
														
 
															+
														
 
															+// Constant fold unary integer dxil intrinsics (Bfrev, Countbits and the
															+// Firstbit* family). Returns nullptr for any other opcode.
															+static Constant *ConstantFoldUnaryIntIntrinsic(OP::OpCode opcode, Type *Ty, ConstantInt *Op) {
															+  const APInt &Value = Op->getValue();
															+  const unsigned Width = Value.getBitWidth();
															+
															+  switch (opcode) {
															+  case OP::OpCode::Bfrev:
															+    return HLSLConstantFoldBfrev(Op, Ty);
															+  case OP::OpCode::Countbits:
															+    return ConstantInt::get(Ty, Value.countPopulation());
															+  case OP::OpCode::FirstbitLo:
															+    return HLSLConstantFoldFindBit(Ty, Value.countTrailingZeros(), Width);
															+  case OP::OpCode::FirstbitHi:
															+    return HLSLConstantFoldFindBit(Ty, Value.countLeadingZeros(), Width);
															+  case OP::OpCode::FirstbitSHi: {
															+    // For negative values skip the leading ones, otherwise the leading
															+    // zeros.
															+    const unsigned Position =
															+        Value.isNegative() ? Value.countLeadingOnes() : Value.countLeadingZeros();
															+    return HLSLConstantFoldFindBit(Ty, Position, Width);
															+  }
															+  default:
															+    break;
															+  }
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Constant fold binary integer dxil intrinsics: signed and unsigned min and
															+// max. Returns nullptr for any other opcode.
															+static Constant *ConstantFoldBinaryIntIntrinsic(OP::OpCode opcode, Type *Ty, ConstantInt *Op1, ConstantInt *Op2) {
															+  const APInt &Lhs = Op1->getValue();
															+  const APInt &Rhs = Op2->getValue();
															+
															+  // Decide whether the first operand is the one to keep; the second is
															+  // kept otherwise (including when both compare equal).
															+  bool KeepLhs = false;
															+  switch (opcode) {
															+  case OP::OpCode::IMin: KeepLhs = Lhs.slt(Rhs); break;
															+  case OP::OpCode::IMax: KeepLhs = Lhs.sgt(Rhs); break;
															+  case OP::OpCode::UMin: KeepLhs = Lhs.ult(Rhs); break;
															+  case OP::OpCode::UMax: KeepLhs = Lhs.ugt(Rhs); break;
															+  default: return nullptr;
															+  }
															+
															+  return ConstantInt::get(Ty, KeepLhs ? Lhs : Rhs);
															+}
														
 
															+
														
 
															+// Shared bit field extract computation for ibfe and ubfe.
															+// The computation for both is the same except for the right shift, which
															+// the caller supplies through shr: an arithmetic shift for ibfe and a
															+// logical shift for ubfe.
															+// ubfe: https://msdn.microsoft.com/en-us/library/windows/desktop/hh447243(v=vs.85).aspx
															+// ibfe: https://msdn.microsoft.com/en-us/library/windows/desktop/hh447243(v=vs.85).aspx
															+static Constant *ComputeBFE(Type *Ty, APInt width, APInt offset, APInt val, std::function<APInt(APInt, APInt)> shr) {
															+  const unsigned numBits = width.getBitWidth();
															+  const APInt bitwidth(numBits, numBits);
															+  const APInt fieldMask = bitwidth - 1;
															+
															+  // Limit width and offset to the bitwidth of the value.
															+  width = width.And(fieldMask);
															+  offset = offset.And(fieldMask);
															+
															+  // An empty field always extracts zero.
															+  if (width == 0)
															+    return ConstantInt::get(Ty, 0);
															+
															+  const APInt fieldEnd = width + offset;
															+  if (!fieldEnd.ult(bitwidth)) {
															+    // The field reaches (or runs past) the top of the value, so shifting
															+    // right by offset is all that is needed.
															+    return ConstantInt::get(Ty, shr(val, offset));
															+  }
															+
															+  // Push the field up against the most significant bit, then bring it back
															+  // down with the caller's shift so that shift decides the upper bits.
															+  const APInt aligned = val.shl(bitwidth - fieldEnd);
															+  return ConstantInt::get(Ty, shr(aligned, bitwidth - width));
															+}
														
 
															+
														
 
															+// Folds a DXIL three-operand integer intrinsic: multiply-add (IMad/UMad)
															+// and bit field extract (Ubfe/Ibfe). Returns nullptr for any other opcode.
															+static Constant *ConstantFoldTernaryIntIntrinsic(OP::OpCode opcode, Type *Ty, ConstantInt *Op1, ConstantInt *Op2, ConstantInt *Op3) {
															+  const APInt &A = Op1->getValue();
															+  const APInt &B = Op2->getValue();
															+  const APInt &C = Op3->getValue();
															+
															+  if (opcode == OP::OpCode::IMad || opcode == OP::OpCode::UMad) {
															+    // Signed and unsigned agree here: this is twos complement and only the
															+    // lower half of the multiply is kept.
															+    return ConstantInt::get(Ty, A * B + C);
															+  }
															+
															+  if (opcode == OP::OpCode::Ubfe) {
															+    auto logicalShr = [](APInt val, APInt amt) { return val.lshr(amt); };
															+    return ComputeBFE(Ty, A, B, C, logicalShr);
															+  }
															+
															+  if (opcode == OP::OpCode::Ibfe) {
															+    auto arithmeticShr = [](APInt val, APInt amt) { return val.ashr(amt); };
															+    return ComputeBFE(Ty, A, B, C, arithmeticShr);
															+  }
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Folds a DXIL four-operand integer intrinsic.
															+//
															+// Bfi is the only quaternary intrinsic handled; any other opcode yields
															+// nullptr. The Bfi computation is described here:
															+// https://msdn.microsoft.com/en-us/library/windows/desktop/hh446837(v=vs.85).aspx
															+//
															+// Op1 is the field width, Op2 the field offset, Op3 the bits to insert and
															+// Op4 the value they are inserted into.
															+static Constant *ConstantFoldQuaternaryIntInstrinsic(OP::OpCode opcode, Type *Ty, ConstantInt *Op1, ConstantInt *Op2, ConstantInt *Op3, ConstantInt *Op4) {
															+  if (opcode != OP::OpCode::Bfi)
															+    return nullptr;
															+
															+  const unsigned numBits = Op1->getValue().getBitWidth();
															+  const APInt bitwidth(numBits, numBits);
															+  const APInt fieldMask = bitwidth - 1;
															+
															+  // Width and offset are limited to the bitwidth of the operands.
															+  const APInt width = Op1->getValue().And(fieldMask);
															+  const APInt offset = Op2->getValue().And(fieldMask);
															+  const APInt &src = Op3->getValue();
															+  const APInt &dst = Op4->getValue();
															+
															+  // bitmask = (((1 << width)-1) << offset) & 0xffffffff
															+  APInt bitmask = APInt(numBits, 1).shl(width);
															+  bitmask = (bitmask - 1).shl(offset);
															+  // Mirrors the reference formula; the all-ones mask has the operand's own
															+  // width, so this step leaves the value unchanged.
															+  bitmask = bitmask.And(APInt::getAllOnesValue(numBits));
															+
															+  // dest = ((src2 << offset) & bitmask) | (src3 & ~bitmask)
															+  const APInt inserted = src.shl(offset).And(bitmask);
															+  const APInt preserved = dst.And(~bitmask);
															+
															+  return ConstantInt::get(Ty, inserted.Or(preserved));
															+}
														
 
															+
														
 
															+// Tells whether opcode is one of the dot product operations
															+// (Dot2, Dot3 or Dot4).
															+static bool IsDotOpcode(OP::OpCode opcode) {
															+  switch (opcode) {
															+  case OP::OpCode::Dot2:
															+  case OP::OpCode::Dot3:
															+  case OP::OpCode::Dot4:
															+    return true;
															+  default:
															+    return false;
															+  }
															+}
														
 
															+
														
 
															+// Entry point for folding floating point intrinsics.
															+// Only half, float and double result types are handled. The call is routed
															+// by operand count to the unary, binary or ternary folder; any other count
															+// is folded only for dot opcodes. Returns nullptr when an operand fails
															+// IsValidOp or nothing applies.
															+static Constant *ConstantFoldFPIntrinsic(OP::OpCode opcode, Type *Ty, const DxilIntrinsicOperands &IntrinsicOperands) {
															+  const bool IsSupportedTy = Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy();
															+  if (!IsSupportedTy)
															+    return nullptr;
															+
															+  if (IntrinsicOperands.Size() == 1) {
															+    ConstantFP *Src = IntrinsicOperands.GetConstantFloat(0);
															+    if (IsValidOp(Src))
															+      return ConstantFoldUnaryFPIntrinsic(opcode, Ty, Src);
															+    return nullptr;
															+  }
															+
															+  if (IntrinsicOperands.Size() == 2) {
															+    ConstantFP *Src0 = IntrinsicOperands.GetConstantFloat(0);
															+    ConstantFP *Src1 = IntrinsicOperands.GetConstantFloat(1);
															+    if (IsValidOp(Src0) && IsValidOp(Src1))
															+      return ConstantFoldBinaryFPIntrinsic(opcode, Ty, Src0, Src1);
															+    return nullptr;
															+  }
															+
															+  if (IntrinsicOperands.Size() == 3) {
															+    ConstantFP *Src0 = IntrinsicOperands.GetConstantFloat(0);
															+    ConstantFP *Src1 = IntrinsicOperands.GetConstantFloat(1);
															+    ConstantFP *Src2 = IntrinsicOperands.GetConstantFloat(2);
															+    if (IsValidOp(Src0) && IsValidOp(Src1) && IsValidOp(Src2))
															+      return ConstantFoldTernaryFPIntrinsic(opcode, Ty, Src0, Src1, Src2);
															+    return nullptr;
															+  }
															+
															+  // Remaining operand counts are only meaningful for dot products.
															+  if (IsDotOpcode(opcode))
															+    return ConstantFoldDot(opcode, Ty, IntrinsicOperands);
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// Entry point for folding integer intrinsics.
															+// Result types wider than int64_t are rejected. The call is routed by
															+// operand count (one to four) to the matching folder. Returns nullptr when
															+// GetConstantInt yields null for any operand or the count is unsupported.
															+static Constant *ConstantFoldIntIntrinsic(OP::OpCode opcode, Type *Ty, const DxilIntrinsicOperands &IntrinsicOperands) {
															+  const bool FitsInInt64 = Ty->getScalarSizeInBits() <= (sizeof(int64_t) * CHAR_BIT);
															+  if (!FitsInInt64)
															+    return nullptr;
															+
															+  if (IntrinsicOperands.Size() == 1) {
															+    ConstantInt *Src = IntrinsicOperands.GetConstantInt(0);
															+    if (Src)
															+      return ConstantFoldUnaryIntIntrinsic(opcode, Ty, Src);
															+    return nullptr;
															+  }
															+
															+  if (IntrinsicOperands.Size() == 2) {
															+    ConstantInt *Src0 = IntrinsicOperands.GetConstantInt(0);
															+    ConstantInt *Src1 = IntrinsicOperands.GetConstantInt(1);
															+    if (Src0 && Src1)
															+      return ConstantFoldBinaryIntIntrinsic(opcode, Ty, Src0, Src1);
															+    return nullptr;
															+  }
															+
															+  if (IntrinsicOperands.Size() == 3) {
															+    ConstantInt *Src0 = IntrinsicOperands.GetConstantInt(0);
															+    ConstantInt *Src1 = IntrinsicOperands.GetConstantInt(1);
															+    ConstantInt *Src2 = IntrinsicOperands.GetConstantInt(2);
															+    if (Src0 && Src1 && Src2)
															+      return ConstantFoldTernaryIntIntrinsic(opcode, Ty, Src0, Src1, Src2);
															+    return nullptr;
															+  }
															+
															+  if (IntrinsicOperands.Size() == 4) {
															+    ConstantInt *Src0 = IntrinsicOperands.GetConstantInt(0);
															+    ConstantInt *Src1 = IntrinsicOperands.GetConstantInt(1);
															+    ConstantInt *Src2 = IntrinsicOperands.GetConstantInt(2);
															+    ConstantInt *Src3 = IntrinsicOperands.GetConstantInt(3);
															+    if (Src0 && Src1 && Src2 && Src3)
															+      return ConstantFoldQuaternaryIntInstrinsic(opcode, Ty, Src0, Src1, Src2, Src3);
															+    return nullptr;
															+  }
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// External entry point for constant folding dxil intrinsics; called from
															+// the llvm constant folding routine.
															+// Returns nullptr when GetDxilOpcode does not produce an opcode for the
															+// call, when Ty is neither a floating point nor an integer type, or when
															+// the type-specific folder declines.
															+Constant *hlsl::ConstantFoldScalarCall(StringRef Name, Type *Ty, ArrayRef<Constant *> RawOperands) {
															+  OP::OpCode opcode;
															+  if (!GetDxilOpcode(Name, RawOperands, opcode))
															+    return nullptr;
															+
															+  DxilIntrinsicOperands IntrinsicOperands(RawOperands);
															+
															+  // Dispatch on the result type of the call.
															+  if (Ty->isFloatingPointTy())
															+    return ConstantFoldFPIntrinsic(opcode, Ty, IntrinsicOperands);
															+
															+  if (Ty->isIntegerTy())
															+    return ConstantFoldIntIntrinsic(opcode, Ty, IntrinsicOperands);
															+
															+  return nullptr;
															+}
														
 
															+
														
 
															+// External entry point to determine if we can constant fold calls to
															+// the given function. We have to overestimate the set of functions because
															+// we only have the function value here instead of the call. We need the
															+// actual call to get the opcode for the intrinsic.
															+//
															+// Returns true when F is a dxil op function whose name starts with one of
															+// the foldable operation-class prefixes below, false otherwise.
															+bool hlsl::CanConstantFoldCallTo(const Function *F) {
															+  if (!OP::IsDxilOpFunc(F))
															+    return false;
															+
															+  // Matched with startswith so that every overload suffix is accepted.
															+  // "dx.op.unary" is also a prefix of "dx.op.unaryBits", so that class is
															+  // covered without a separate (unreachable) entry.
															+  static const char *const FoldablePrefixes[] = {
															+    "dx.op.unary",
															+    "dx.op.binary",
															+    "dx.op.tertiary",
															+    "dx.op.quaternary",
															+    "dx.op.dot",
															+  };
															+
															+  const StringRef Name = F->getName();
															+  for (const char *Prefix : FoldablePrefixes) {
															+    if (Name.startswith(Prefix))
															+      return true;
															+  }
															+
															+  return false;
															+}
														
--- a/lib/HLSL/DxilOperations.cpp
+++ b/lib/HLSL/DxilOperations.cpp
@@ -324,11 +324,16 @@ bool OP::CheckOpCodeTable() {
 
															   return true;
														
 
															 }
														
 
															-bool OP::IsDxilOpFunc(const llvm::Function *F) {
														
 
															-  StringRef name = F->getName();
														
 
															+bool OP::IsDxilOpFuncName(StringRef name) {
														
 
															   return name.startswith(OP::m_NamePrefix);
														
 
															 }
														
 
															+bool OP::IsDxilOpFunc(const llvm::Function *F) {
														
 
															+  if (!F->hasName())
														
 
															+    return false;
														
 
															+  return IsDxilOpFuncName(F->getName());
														
 
															+}
														
 
															+
														
 
															 bool OP::IsDxilOpFuncCallInst(const llvm::Instruction *I) {
														
 
															   const CallInst *CI = dyn_cast<CallInst>(I);
														
 
															   if (CI == nullptr) return false;
														
--- a/tools/clang/test/CodeGenHLSL/Samples/DX11/SubD11_SmoothPS.hlsl
+++ b/tools/clang/test/CodeGenHLSL/Samples/DX11/SubD11_SmoothPS.hlsl
@@ -9,7 +9,6 @@
 
															 // CHECK: sample
														
 
															 // CHECK: Log
														
 
															 // CHECK: Exp
														
 
															-// CHECK: dot3
														
 
															 // CHECK: Sqrt
														
 
															 // CHECK: dot3
														
 
															 // CHECK: Saturate
														
--- a/tools/clang/test/CodeGenHLSL/firstbitHi.hlsl
+++ b/tools/clang/test/CodeGenHLSL/firstbitHi.hlsl
@@ -1,19 +1,19 @@
 
															 // RUN: %dxc -E main -T ps_6_0 %s | FileCheck %s
														
 
															-// CHECK: FirstbitHi
														
 
															+// CHECK: call {{.*}} FirstbitHi
														
 
															 // CHECK: sub i32 31
														
 
															 // CHECK: icmp eq i32 {{.*}}, -1
														
 
															 // CHECK: select
														
 
															 // CHECK: i32 -1
														
 
															-// CHECK: FirstbitSHi
														
 
															+// CHECK: call {{.*}} FirstbitSHi
														
 
															 // CHECK: sub i32 31
														
 
															 // CHECK: icmp eq i32 {{.*}}, -1
														
 
															 // CHECK: select
														
 
															 // CHECK: i32 -1
														
 
															-// CHECK: FirstbitSHi
														
 
															-// CHECK: FirstbitSHi
														
 
															+// CHECK: call void @dx.op.bufferStore.i32{{.*}}, i32 5 
														
 
															+// CHECK: call void @dx.op.bufferStore.i32{{.*}}, i32 8
														
 
															 // CHECK: dx.op.unaryBits.i64(i32 33, i64
														
 
															 // CHECK: sub i32 63
														
--- a/tools/clang/test/CodeGenHLSL/firstbitLo.hlsl
+++ b/tools/clang/test/CodeGenHLSL/firstbitLo.hlsl
@@ -1,14 +1,13 @@
 
															 // RUN: %dxc -E main -T ps_6_0 %s | FileCheck %s
														
 
															-// CHECK: FirstbitLo
														
 
															+// CHECK: call i32 @dx.op.unaryBits.i32{{.*}} FirstbitLo
														
 
															-// CHECK: FirstbitLo
														
 
															+// CHECK: call i32 @dx.op.unaryBits.i32{{.*}} FirstbitLo
														
 
															-// CHECK: FirstbitLo
														
 
															-// CHECK: FirstbitLo
														
 
															+// CHECK: call void @dx.op.bufferStore.i32{{.*}}, i32 5 
														
 
															+// CHECK: call void @dx.op.bufferStore.i32{{.*}}, i32 9 
														
 
															-// CHECK: dx.op.unaryBits.i64
														
 
															-// CHECK: FirstbitLo
														
 
															+// CHECK: call i32 @dx.op.unaryBits.i64{{.*}} FirstbitLo
														
 
															 uint a;
														
 
															 int2 b;
														
--- a/tools/clang/test/CodeGenHLSL/firstbitshi_const.hlsl
+++ b/tools/clang/test/CodeGenHLSL/firstbitshi_const.hlsl
@@ -1,6 +1,6 @@
 
															 // RUN: %dxc -E main -T ps_6_0 %s | FileCheck %s
														
 
															-// CHECK: FirstbitSHi
														
 
															+// CHECK: call void @dx.op.storeOutput.i32{{.*}}, i32 -1
														
 
															 [RootSignature("")]
														
 
															 int main() : SV_Target {
														
--- a/tools/clang/test/HLSL/constprop/Acos.hlsl
+++ b/tools/clang/test/HLSL/constprop/Acos.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FF0C15240000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return acos(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Asin.hlsl
+++ b/tools/clang/test/HLSL/constprop/Asin.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FE0C15240000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return asin(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Atan.hlsl
+++ b/tools/clang/test/HLSL/constprop/Atan.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FDDAC6700000000 
														
 
															+
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return atan(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Bfrev.hlsl
+++ b/tools/clang/test/HLSL/constprop/Bfrev.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 1532713819
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    uint64_t s = reversebits(114ULL);
														
 
															+    int x = 0xdadadada;
														
 
															+    return reversebits(x);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Cos.hlsl
+++ b/tools/clang/test/HLSL/constprop/Cos.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FB21BD540000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 1.5;
														
 
															+    return cos(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Countbits.hlsl
+++ b/tools/clang/test/HLSL/constprop/Countbits.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 23
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = 0xdadadada;
														
 
															+    uint64_t y = 0x30100000000ULL;
														
 
															+    return countbits(x) + countbits(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Dot2.hlsl
+++ b/tools/clang/test/HLSL/constprop/Dot2.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.328125e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float2 x = float2(0.5, 0.125);
														
 
															+    float2 y = float2(0.25, 0.0625);
														
 
															+    return dot(x, y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Dot3.hlsl
+++ b/tools/clang/test/HLSL/constprop/Dot3.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x400F100000000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float3 x = float3(0.5, 0.125, 1.5);
														
 
															+    float3 y = float3(0.25, 0.0625, 2.5);
														
 
															+    return dot(x, y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Dot4.hlsl
+++ b/tools/clang/test/HLSL/constprop/Dot4.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x4044010000000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float4 x = float4(0.5, 0.125, 1.5, 8.5);
														
 
															+    float4 y = float4(0.25, 0.0625, 2.5, 4.25);
														
 
															+    return dot(x, y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Exp.hlsl
+++ b/tools/clang/test/HLSL/constprop/Exp.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FD346C420000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = -1.2;
														
 
															+    return exp(x);
														
 
															+}
														
 
															+
														
--- a/tools/clang/test/HLSL/constprop/FAbs.hlsl
+++ b/tools/clang/test/HLSL/constprop/FAbs.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FF3333340000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = -1.2;
														
 
															+    return abs(x);
														
 
															+}
														
 
															+
														
--- a/tools/clang/test/HLSL/constprop/FMad.hlsl
+++ b/tools/clang/test/HLSL/constprop/FMad.hlsl
@@ -0,0 +1,17 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 5.078125e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float   x = 0.5;
														
 
															+    float   y = 0.25;
														
 
															+    float   z = 0.125;
														
 
															+    float   f = mad(x, y, z);    // 0.25
														
 
															+
														
 
															+    double d1 = 0.0625;
														
 
															+    double d2 = 0.125;
														
 
															+    double d3 = 0.25;
														
 
															+    double d  = mad(d1, d2, d3); // 0.2578125
														
 
															+
														
 
															+    return f + d;
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/FMax.hlsl
+++ b/tools/clang/test/HLSL/constprop/FMax.hlsl
@@ -0,0 +1,13 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = 0.5;
														
 
															+    float y = 0.25;
														
 
															+    
														
 
															+    double d1 = 0.5;
														
 
															+    double d2 = 0.25;
														
 
															+
														
 
															+    return max(x, y) + max(d1, d2);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/FMin.hlsl
+++ b/tools/clang/test/HLSL/constprop/FMin.hlsl
@@ -0,0 +1,13 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 5.000000e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = 0.5;
														
 
															+    float y = 0.25;
														
 
															+    
														
 
															+    double d1 = 0.5;
														
 
															+    double d2 = 0.25;
														
 
															+
														
 
															+    return min(x, y) + min(d1, d2);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Firstbithi.hlsl
+++ b/tools/clang/test/HLSL/constprop/Firstbithi.hlsl
@@ -0,0 +1,37 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 189
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = 0x0;           // firstbithigh(x) = -1
														
 
															+    int y = 0x0010;        // firstbithigh(y) =  4
														
 
															+    int z = 0x80000000;    // firstbithigh(z) = 30
														
 
															+    int w = 0xffffffff;    // firstbithigh(w) = -1
														
 
															+    
														
 
															+    uint ux = 0x0;         // firstbithigh(ux) = -1
														
 
															+    uint uy = 0x1000;      // firstbithigh(uy) = 12
														
 
															+    uint uz = 0x80000000;  // firstbithigh(uz) = 31
														
 
															+    uint uw = 0xffffffff;  // firstbithigh(uw) = 31
														
 
															+    
														
 
															+    // TODO: add tests for int64_t when constant literals are fixed
														
 
															+    
														
 
															+    uint64_t lux = 0x0ULL;           // firstbithigh(lux) = -1
														
 
															+    uint64_t luy = 0x1000ULL;        // firstbithigh(luy) = 12
														
 
															+    uint64_t luz = 0x00100000000ULL; // firstbithi(luz) = 32
														
 
															+    uint64_t luw = 0x30000000000ULL; // firstbithi(luw) = 41
														
 
															+    
														
 
															+    
														
 
															+    return firstbithigh(x)
														
 
															+         + firstbithigh(y)
														
 
															+         + firstbithigh(z)
														
 
															+         + firstbithigh(w)
														
 
															+         + firstbithigh(ux)
														
 
															+         + firstbithigh(uy)
														
 
															+         + firstbithigh(uz)
														
 
															+         + firstbithigh(uw)
														
 
															+         + firstbithigh(lux)
														
 
															+         + firstbithigh(luy)
														
 
															+         + firstbithigh(luz)
														
 
															+         + firstbithigh(luw)
														
 
															+         ;
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Firstbitlo.hlsl
+++ b/tools/clang/test/HLSL/constprop/Firstbitlo.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 42
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = 0x0;                   // firstbitlow(x) = -1
														
 
															+    int y = 0x100;                 // firstbitlow(y) =  8
														
 
															+    int z = 0x110;                 // firstbitlow(z) =  4
														
 
															+    uint64_t w = 0x30100000000ULL; // firstbitlow(w) = 32
														
 
															+    uint64_t s = 0x0ULL;           // firstbitlow(s) = -1
														
 
															+    return firstbitlow(x) + firstbitlow(y) + firstbitlow(z) + firstbitlow(w) + firstbitlow(s);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Fma.hlsl
+++ b/tools/clang/test/HLSL/constprop/Fma.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 2.500000e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    double x = 0.5;
														
 
															+    double y = 0.25;
														
 
															+    double z = 0.125;
														
 
															+    double d = fma(x, y, z); // 0.25
														
 
															+
														
 
															+    return d;
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Frc.hlsl
+++ b/tools/clang/test/HLSL/constprop/Frc.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 5.000000e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = -1.5;
														
 
															+    return frac(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Hcos.hlsl
+++ b/tools/clang/test/HLSL/constprop/Hcos.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FF20AC180000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return cosh(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Hsin.hlsl
+++ b/tools/clang/test/HLSL/constprop/Hsin.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FE0ACD000000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return sinh(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Htan.hlsl
+++ b/tools/clang/test/HLSL/constprop/Htan.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FDD9353E0000000 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.5;
														
 
															+    return tanh(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/IMad.hlsl
+++ b/tools/clang/test/HLSL/constprop/IMad.hlsl
@@ -0,0 +1,10 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 -7
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = -2;
														
 
															+    int y = 5;
														
 
															+    int z = 3;
														
 
															+    return mad(x, y ,z); // -7
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/IMax.hlsl
+++ b/tools/clang/test/HLSL/constprop/IMax.hlsl
@@ -0,0 +1,11 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 25
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = 5;
														
 
															+    int y = 25;
														
 
															+    int z = -1;
														
 
															+
														
 
															+    return max(max(x, y), z);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/IMin.hlsl
+++ b/tools/clang/test/HLSL/constprop/IMin.hlsl
@@ -0,0 +1,11 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 -1
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+int main() : SV_Target {
														
 
															+    int x = 5;
														
 
															+    int y = 25;
														
 
															+    int z = -1;
														
 
															+
														
 
															+    return min(min(x, y), z);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Log.hlsl
+++ b/tools/clang/test/HLSL/constprop/Log.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FD9F323E0000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 1.5;
														
 
															+    return log(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Round_ne.hlsl
+++ b/tools/clang/test/HLSL/constprop/Round_ne.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 4.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = 1.5;
														
 
															+    float y = 2.5;
														
 
															+    return round(x) + round(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Round_ni.hlsl
+++ b/tools/clang/test/HLSL/constprop/Round_ni.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 3.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = 1.5;
														
 
															+    float y = 2.5;
														
 
															+    return floor(x) + floor(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Round_pi.hlsl
+++ b/tools/clang/test/HLSL/constprop/Round_pi.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 5.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = 1.5;
														
 
															+    float y = 2.5;
														
 
															+    return ceil(x) + ceil(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Round_z.hlsl
+++ b/tools/clang/test/HLSL/constprop/Round_z.hlsl
@@ -0,0 +1,9 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = -1.5;
														
 
															+    float y = 2.5;
														
 
															+    return trunc(x) + trunc(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Rsqrt.hlsl
+++ b/tools/clang/test/HLSL/constprop/Rsqrt.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 4.000000e+00
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.0625;
														
 
															+    return rsqrt(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Saturate_double.hlsl
+++ b/tools/clang/test/HLSL/constprop/Saturate_double.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.500000e+00 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    double x = -1.2;
														
 
															+    double y = 1.2;
														
 
															+    double z = 0.5;
														
 
															+    return saturate(x)
														
 
															+         + saturate(y)
														
 
															+         + saturate(z);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Saturate_float.hlsl
+++ b/tools/clang/test/HLSL/constprop/Saturate_float.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.500000e+00 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    float x = -1.2;
														
 
															+    float y =  1.2;
														
 
															+    float z =  0.5;
														
 
															+    return saturate(x)
														
 
															+         + saturate(y)
														
 
															+         + saturate(z);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Saturate_half.hlsl
+++ b/tools/clang/test/HLSL/constprop/Saturate_half.hlsl
@@ -0,0 +1,12 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 1.500000e+00 
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main() : SV_Target {
														
 
															+    min16float x = -1.2;
														
 
															+    min16float y = 1.2;
														
 
															+    min16float z = 0.5;
														
 
															+    return saturate(x)
														
 
															+         + saturate(y)
														
 
															+         + saturate(z);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Sin.hlsl
+++ b/tools/clang/test/HLSL/constprop/Sin.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x3FEFEB7AA0000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 1.5;
														
 
															+    return sin(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Sqrt.hlsl
+++ b/tools/clang/test/HLSL/constprop/Sqrt.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 2.500000e-01
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 0.0625;
														
 
															+    return sqrt(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/Tan.hlsl
+++ b/tools/clang/test/HLSL/constprop/Tan.hlsl
@@ -0,0 +1,8 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} float 0x402C33ED60000000
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+float main(float x : A) : SV_Target {
														
 
															+    float y = 1.5;
														
 
															+    return tan(y);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/UMad.hlsl
+++ b/tools/clang/test/HLSL/constprop/UMad.hlsl
@@ -0,0 +1,15 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 -4
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+uint main() : SV_Target {
														
 
															+    uint x = -2;
														
 
															+    uint y = 5;
														
 
															+    uint z = 3;
														
 
															+
														
 
															+    uint64_t xl = 0x100000000ULL;
														
 
															+    uint64_t yl = 0x000000002ULL;
														
 
															+    uint64_t zl = 0x000000003ULL;
														
 
															+    return mad(x, y ,z)     // -7
														
 
															+         + mad(xl, yl, zl); // 0x200000003
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/UMax.hlsl
+++ b/tools/clang/test/HLSL/constprop/UMax.hlsl
@@ -0,0 +1,15 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 -2
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+uint main() : SV_Target {
														
 
															+    uint ux = 5;
														
 
															+    uint uy = 25;
														
 
															+    uint uz = -1;
														
 
															+    
														
 
															+    uint64_t lx = 7ULL;
														
 
															+    uint64_t ly = 25ULL;
														
 
															+    uint64_t lz = -1ULL;
														
 
															+
														
 
															+    return max(max(ux, uy), uz) + max(max(lx, ly), lz);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/UMin.hlsl
+++ b/tools/clang/test/HLSL/constprop/UMin.hlsl
@@ -0,0 +1,15 @@
 
															+// RUN: %dxc -T ps_6_0 %s -E main | %FileCheck %s
														
 
															+// CHECK: call void @dx.op.storeOutput{{.*}} i32 12
														
 
															+
														
 
															+[RootSignature("")]
														
 
															+uint main() : SV_Target {
														
 
															+    uint ux = 5;
														
 
															+    uint uy = 25;
														
 
															+    uint uz = -1;
														
 
															+    
														
 
															+    uint64_t lx = 7ULL;
														
 
															+    uint64_t ly = 25ULL;
														
 
															+    uint64_t lz = -1ULL;
														
 
															+
														
 
															+    return min(min(ux, uy), uz) + min(min(lx, ly), lz);
														
 
															+}
														
--- a/tools/clang/test/HLSL/constprop/bfi.ll
+++ b/tools/clang/test/HLSL/constprop/bfi.ll
@@ -0,0 +1,95 @@
 
															+; RUN: %opt %s -sccp -S | FileCheck %s
														
 
															+
														
 
															+target datalayout = "e-m:e-p:32:32-i64:64-f80:32-n8:16:32-a:0:32-S32"
														
 
															+target triple = "dxil-ms-dx"
														
 
															+
														
 
															+%dx.types.Handle = type { i8* }
														
 
															+%struct.RWByteAddressBuffer = type { i32 }
														
 
															+
														
 
															+define void @main() {
														
 
															+entry:
														
 
															+  %buf_UAV_rawbuf = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 1, i32 0, i32 0, i1 false)  ; CreateHandle(resourceClass,rangeId,index,nonUniformIndex)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 510,
														
 
															+  %0 = call i32 @dx.op.quaternary.i32(i32 53, i32 8, i32 1, i32 255, i32 0)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 0, i32 undef, i32 %0, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 255,
														
 
															+  %1 = call i32 @dx.op.quaternary.i32(i32 53, i32 8, i32 32, i32 255, i32 0)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 4, i32 undef, i32 %1, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -1091584273,
														
 
															+  %2 = call i32 @dx.op.quaternary.i32(i32 53, i32 16, i32 16, i32 48879, i32 3735928559)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 8, i32 undef, i32 %2, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 322420463,
														
 
															+  %3 = call i32 @dx.op.quaternary.i32(i32 53, i32 8, i32 16, i32 55, i32 318815983)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 12, i32 undef, i32 %3, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 15,
														
 
															+  %4 = call i32 @dx.op.quaternary.i32(i32 53, i32 0, i32 8, i32 0, i32 15)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 16, i32 undef, i32 %4, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 2560,
														
 
															+  %5 = call i64 @dx.op.quaternary.i64(i32 53, i64 4, i64 8, i64 4010, i64 0)
														
 
															+  %6 = trunc i64 %5 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 20, i32 undef, i32 %6, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 10,
														
 
															+  %7 = call i64 @dx.op.quaternary.i64(i32 53, i64 4, i64 32, i64 4010, i64 0)
														
 
															+  %8 = lshr i64 %7, 32
														
 
															+  %9 = trunc i64 %8 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 24, i32 undef, i32 %9, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  call void @dx.op.storeOutput.i32(i32 5, i32 0, i32 0, i8 0, i32 0)  ; StoreOutput(outputSigId,rowIndex,colIndex,value)
														
 
															+  ret void
														
 
															+}
														
 
															+
														
 
															+; Function Attrs: nounwind readnone
														
 
															+declare i32 @dx.op.loadInput.i32(i32, i32, i32, i8, i32) #0
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.storeOutput.i32(i32, i32, i32, i8, i32) #1
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.bufferStore.i32(i32, %dx.types.Handle, i32, i32, i32, i32, i32, i32, i8) #1
														
 
															+
														
 
															+; Function Attrs: nounwind readonly
														
 
															+declare %dx.types.Handle @dx.op.createHandle(i32, i8, i32, i32, i1) #2
														
 
															+
														
 
															+declare i32 @dx.op.quaternary.i32(i32, i32, i32, i32, i32) #1
														
 
															+declare i64 @dx.op.quaternary.i64(i32, i64, i64, i64, i64) #1
														
 
															+
														
 
															+attributes #0 = { nounwind readnone }
														
 
															+attributes #1 = { nounwind }
														
 
															+attributes #2 = { nounwind readonly }
														
 
															+
														
 
															+!llvm.ident = !{!0}
														
 
															+!dx.valver = !{!1}
														
 
															+!dx.version = !{!1}
														
 
															+!dx.shaderModel = !{!2}
														
 
															+!dx.resources = !{!3}
														
 
															+!dx.typeAnnotations = !{!6, !9}
														
 
															+!dx.entryPoints = !{!13}
														
 
															+
														
 
															+!0 = !{!"clang version 3.7 (tags/RELEASE_370/final)"}
														
 
															+!1 = !{i32 1, i32 0}
														
 
															+!2 = !{!"ps", i32 6, i32 0}
														
 
															+!3 = !{null, !4, null, null}
														
 
															+!4 = !{!5}
														
 
															+!5 = !{i32 0, %struct.RWByteAddressBuffer* undef, !"buf", i32 0, i32 0, i32 1, i32 11, i1 false, i1 false, i1 false, null}
														
 
															+!6 = !{i32 0, %struct.RWByteAddressBuffer undef, !7}
														
 
															+!7 = !{i32 4, !8}
														
 
															+!8 = !{i32 6, !"h", i32 3, i32 0, i32 7, i32 4}
														
 
															+!9 = !{i32 1, void ()* @main, !10}
														
 
															+!10 = !{!11}
														
 
															+!11 = !{i32 0, !12, !12}
														
 
															+!12 = !{}
														
 
															+!13 = !{void ()* @main, !"main", !14, !3, !20}
														
 
															+!14 = !{!15, !18, null}
														
 
															+!15 = !{!16}
														
 
															+!16 = !{i32 0, !"A", i8 4, i8 0, !17, i8 1, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!17 = !{i32 0}
														
 
															+!18 = !{!19}
														
 
															+!19 = !{i32 0, !"SV_Target", i8 4, i8 16, !17, i8 0, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!20 = !{i32 0, i64 16}
														
--- a/tools/clang/test/HLSL/constprop/ibfe.ll
+++ b/tools/clang/test/HLSL/constprop/ibfe.ll
@@ -0,0 +1,103 @@
 
															+; RUN: %opt %s -sccp -S | FileCheck %s
														
 
															+
														
 
															+target datalayout = "e-m:e-p:32:32-i64:64-f80:32-n8:16:32-a:0:32-S32"
														
 
															+target triple = "dxil-ms-dx"
														
 
															+
														
 
															+%dx.types.Handle = type { i8* }
														
 
															+%struct.RWByteAddressBuffer = type { i32 }
														
 
															+
														
 
															+define void @main() {
														
 
															+entry:
														
 
															+  %buf_UAV_rawbuf = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 1, i32 0, i32 0, i1 false)  ; CreateHandle(resourceClass,rangeId,index,nonUniformIndex)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -9510,
														
 
															+  %0 = call i32 @dx.op.tertiary.i32(i32 51, i32 16, i32 16, i32 3671719936)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 0, i32 undef, i32 %0, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 0,
														
 
															+  %1 = call i32 @dx.op.tertiary.i32(i32 51, i32 32, i32 16, i32 3671719936)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 4, i32 undef, i32 %1, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -255,
														
 
															+  %2 = call i32 @dx.op.tertiary.i32(i32 51, i32 11, i32 0, i32 3841)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 8, i32 undef, i32 %2, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -1,
														
 
															+  %3 = call i32 @dx.op.tertiary.i32(i32 51, i32 1, i32 0, i32 3841)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 12, i32 undef, i32 %3, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -1,
														
 
															+  %4 = call i64 @dx.op.tertiary.i64(i32 51, i64 1, i64 32, i64 4294967296)
														
 
															+  %5 = lshr i64 %4, 0
														
 
															+  %6 = trunc i64 %5 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 16, i32 undef, i32 %6, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %7 = call i64 @dx.op.tertiary.i64(i32 51, i64 2, i64 32, i64 4294967296)
														
 
															+  %8 = lshr i64 %7, 0
														
 
															+  %9 = trunc i64 %8 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 20, i32 undef, i32 %9, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 -15,
														
 
															+  %10 = call i64 @dx.op.tertiary.i64(i32 51, i64 39, i64 0, i64 1035087118336)
														
 
															+  %11 = lshr i64 %10, 32
														
 
															+  %12 = trunc i64 %11 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 24, i32 undef, i32 %12, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %13 = call i64 @dx.op.tertiary.i64(i32 51, i64 66, i64 0, i64 1)
														
 
															+  %14 = trunc i64 %13 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 28, i32 undef, i32 %14, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+
														
 
															+  call void @dx.op.storeOutput.i32(i32 5, i32 0, i32 0, i8 0, i32 0)  ; StoreOutput(outputSigId,rowIndex,colIndex,value)
														
 
															+  ret void
														
 
															+}
														
 
															+
														
 
															+; Function Attrs: nounwind readnone
														
 
															+declare i32 @dx.op.loadInput.i32(i32, i32, i32, i8, i32) #0
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.storeOutput.i32(i32, i32, i32, i8, i32) #1
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.bufferStore.i32(i32, %dx.types.Handle, i32, i32, i32, i32, i32, i32, i8) #1
														
 
															+
														
 
															+; Function Attrs: nounwind readonly
														
 
															+declare %dx.types.Handle @dx.op.createHandle(i32, i8, i32, i32, i1) #2
														
 
															+
														
 
															+declare i32 @dx.op.tertiary.i32(i32, i32, i32, i32) #1
														
 
															+declare i64 @dx.op.tertiary.i64(i32, i64, i64, i64) #1
														
 
															+
														
 
															+attributes #0 = { nounwind readnone }
														
 
															+attributes #1 = { nounwind }
														
 
															+attributes #2 = { nounwind readonly }
														
 
															+
														
 
															+!llvm.ident = !{!0}
														
 
															+!dx.valver = !{!1}
														
 
															+!dx.version = !{!1}
														
 
															+!dx.shaderModel = !{!2}
														
 
															+!dx.resources = !{!3}
														
 
															+!dx.typeAnnotations = !{!6, !9}
														
 
															+!dx.entryPoints = !{!13}
														
 
															+
														
 
															+!0 = !{!"clang version 3.7 (tags/RELEASE_370/final)"}
														
 
															+!1 = !{i32 1, i32 0}
														
 
															+!2 = !{!"ps", i32 6, i32 0}
														
 
															+!3 = !{null, !4, null, null}
														
 
															+!4 = !{!5}
														
 
															+!5 = !{i32 0, %struct.RWByteAddressBuffer* undef, !"buf", i32 0, i32 0, i32 1, i32 11, i1 false, i1 false, i1 false, null}
														
 
															+!6 = !{i32 0, %struct.RWByteAddressBuffer undef, !7}
														
 
															+!7 = !{i32 4, !8}
														
 
															+!8 = !{i32 6, !"h", i32 3, i32 0, i32 7, i32 4}
														
 
															+!9 = !{i32 1, void ()* @main, !10}
														
 
															+!10 = !{!11}
														
 
															+!11 = !{i32 0, !12, !12}
														
 
															+!12 = !{}
														
 
															+!13 = !{void ()* @main, !"main", !14, !3, !20}
														
 
															+!14 = !{!15, !18, null}
														
 
															+!15 = !{!16}
														
 
															+!16 = !{i32 0, !"A", i8 4, i8 0, !17, i8 1, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!17 = !{i32 0}
														
 
															+!18 = !{!19}
														
 
															+!19 = !{i32 0, !"SV_Target", i8 4, i8 16, !17, i8 0, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!20 = !{i32 0, i64 16}
														
--- a/tools/clang/test/HLSL/constprop/ubfe.ll
+++ b/tools/clang/test/HLSL/constprop/ubfe.ll
@@ -0,0 +1,103 @@
 
															+; RUN: %opt %s -sccp -S | FileCheck %s
														
 
															+
														
 
															+target datalayout = "e-m:e-p:32:32-i64:64-f80:32-n8:16:32-a:0:32-S32"
														
 
															+target triple = "dxil-ms-dx"
														
 
															+
														
 
															+%dx.types.Handle = type { i8* }
														
 
															+%struct.RWByteAddressBuffer = type { i32 }
														
 
															+
														
 
															+define void @main() {  ; Eight constant-operand dx.op.tertiary calls (opcode 52; Ubfe, going by this file's name); each result is written to the raw UAV so the folded constant shows up in a bufferStore operand.
														
 
															+entry:
														
 
															+  %buf_UAV_rawbuf = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 1, i32 0, i32 0, i1 false)  ; CreateHandle(resourceClass,rangeId,index,nonUniformIndex)
														
 
															+  ; i32 case: width 11, offset 0, value 3841 (0xF01) -> low 11 bits = 0x701 = 1793.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1793,
														
 
															+  %0 = call i32 @dx.op.tertiary.i32(i32 52, i32 11, i32 0, i32 3841)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 0, i32 undef, i32 %0, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i32 case: width 1, offset 0, value 3841 (0xF01) -> bit 0 = 1.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %1 = call i32 @dx.op.tertiary.i32(i32 52, i32 1, i32 0, i32 3841)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 4, i32 undef, i32 %1, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i32 case: width 16, offset 16, value 3671719936 (0xDADA0000) -> upper 16 bits = 0xDADA = 56026.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 56026,
														
 
															+  %2 = call i32 @dx.op.tertiary.i32(i32 52, i32 16, i32 16, i32 3671719936)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 8, i32 undef, i32 %2, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i32 case: width operand 32, expected result 0 (presumably the width is masked to 5 bits, i.e. treated as 0 -- confirm against the DXIL spec).
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 0,
														
 
															+  %3 = call i32 @dx.op.tertiary.i32(i32 52, i32 32, i32 16, i32 3671719936)
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 12, i32 undef, i32 %3, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i64 case: width 1, offset 32, value 4294967296 (1 << 32) -> bit 32 = 1; the lshr by 0 plus trunc keep the low 32 bits of the result.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %4 = call i64 @dx.op.tertiary.i64(i32 52, i64 1, i64 32, i64 4294967296)
														
 
															+  %5 = lshr i64 %4, 0
														
 
															+  %6 = trunc i64 %5 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 16, i32 undef, i32 %6, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i64 case: width 2, offset 32, value 4294967296 (1 << 32) -> bits 32..33 = 1.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %7 = call i64 @dx.op.tertiary.i64(i32 52, i64 2, i64 32, i64 4294967296)
														
 
															+  %8 = lshr i64 %7, 0
														
 
															+  %9 = trunc i64 %8 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 20, i32 undef, i32 %9, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i64 case: width 39, offset 0, value 1035087118336 (0xF1 << 32) -> low 39 bits kept; after the lshr by 32 the stored word is 0x71 = 113.
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 113,
														
 
															+  %10 = call i64 @dx.op.tertiary.i64(i32 52, i64 39, i64 0, i64 1035087118336)
														
 
															+  %11 = lshr i64 %10, 32
														
 
															+  %12 = trunc i64 %11 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 24, i32 undef, i32 %12, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+  ; i64 case: width operand 66, offset 0, value 1 -> expected 1 (presumably the width is masked to 6 bits, giving 2 -- confirm against the DXIL spec).
														
 
															+  ; CHECK: @dx.op.bufferStore{{.*}}, i32 1,
														
 
															+  %13 = call i64 @dx.op.tertiary.i64(i32 52, i64 66, i64 0, i64 1)
														
 
															+  %14 = trunc i64 %13 to i32
														
 
															+  call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %buf_UAV_rawbuf, i32 28, i32 undef, i32 %14, i32 undef, i32 undef, i32 undef, i8 1)  ; BufferStore(uav,coord0,coord1,value0,value1,value2,value3,mask)
														
 
															+
														
 
															+  call void @dx.op.storeOutput.i32(i32 5, i32 0, i32 0, i8 0, i32 0)  ; StoreOutput(outputSigId,rowIndex,colIndex,value)
														
 
															+  ret void
														
 
															+}
														
 
															+
														
 
															+; Function Attrs: nounwind readnone
														
 
															+declare i32 @dx.op.loadInput.i32(i32, i32, i32, i8, i32) #0
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.storeOutput.i32(i32, i32, i32, i8, i32) #1
														
 
															+
														
 
															+; Function Attrs: nounwind
														
 
															+declare void @dx.op.bufferStore.i32(i32, %dx.types.Handle, i32, i32, i32, i32, i32, i32, i8) #1
														
 
															+
														
 
															+; Function Attrs: nounwind readonly
														
 
															+declare %dx.types.Handle @dx.op.createHandle(i32, i8, i32, i32, i1) #2
														
 
															+
														
 
															+declare i32 @dx.op.tertiary.i32(i32, i32, i32, i32) #1
														
 
															+declare i64 @dx.op.tertiary.i64(i32, i64, i64, i64) #1
														
 
															+
														
 
															+attributes #0 = { nounwind readnone }
														
 
															+attributes #1 = { nounwind }
														
 
															+attributes #2 = { nounwind readonly }
														
 
															+
														
 
															+!llvm.ident = !{!0}
														
 
															+!dx.valver = !{!1}
														
 
															+!dx.version = !{!1}
														
 
															+!dx.shaderModel = !{!2}
														
 
															+!dx.resources = !{!3}
														
 
															+!dx.typeAnnotations = !{!6, !9}
														
 
															+!dx.entryPoints = !{!13}
														
 
															+
														
 
															+!0 = !{!"clang version 3.7 (tags/RELEASE_370/final)"}
														
 
															+!1 = !{i32 1, i32 0}
														
 
															+!2 = !{!"ps", i32 6, i32 0}
														
 
															+!3 = !{null, !4, null, null}
														
 
															+!4 = !{!5}
														
 
															+!5 = !{i32 0, %struct.RWByteAddressBuffer* undef, !"buf", i32 0, i32 0, i32 1, i32 11, i1 false, i1 false, i1 false, null}
														
 
															+!6 = !{i32 0, %struct.RWByteAddressBuffer undef, !7}
														
 
															+!7 = !{i32 4, !8}
														
 
															+!8 = !{i32 6, !"h", i32 3, i32 0, i32 7, i32 4}
														
 
															+!9 = !{i32 1, void ()* @main, !10}
														
 
															+!10 = !{!11}
														
 
															+!11 = !{i32 0, !12, !12}
														
 
															+!12 = !{}
														
 
															+!13 = !{void ()* @main, !"main", !14, !3, !20}
														
 
															+!14 = !{!15, !18, null}
														
 
															+!15 = !{!16}
														
 
															+!16 = !{i32 0, !"A", i8 4, i8 0, !17, i8 1, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!17 = !{i32 0}
														
 
															+!18 = !{!19}
														
 
															+!19 = !{i32 0, !"SV_Target", i8 4, i8 16, !17, i8 0, i32 1, i8 1, i32 0, i8 0, null}
														
 
															+!20 = !{i32 0, i64 16}
														
--- a/tools/clang/unittests/HLSL/CompilerTest.cpp
+++ b/tools/clang/unittests/HLSL/CompilerTest.cpp
@@ -839,6 +839,7 @@ public:
 
															   TEST_METHOD(CodeGenDx12MiniEngineTonemapcs)
														
 
															   TEST_METHOD(CodeGenDx12MiniEngineUpsampleandblurcs)
														
 
															   TEST_METHOD(DxilGen_StoreOutput)
														
 
															+  TEST_METHOD(ConstantFolding)
														
 
															   dxc::DxcDllSupport m_dllSupport;
														
 
															   bool m_CompilerPreservesBBNames;
														
@@ -4102,6 +4103,56 @@ TEST_F(CompilerTest, DxilGen_StoreOutput) {
 
															   CodeGenTestCheck(L"..\\CodeGenHLSL\\dxilgen_storeoutput.hlsl");
														
 
															 }
														
 
															+TEST_F(CompilerTest, ConstantFolding) {  // Hands each constprop test input below to CodeGenTestCheck, in the order listed.
														
 
															+  CodeGenTestCheck(L"constprop\\FAbs.hlsl");  // First group: inputs named after single-operand floating-point operations.
														
 
															+  CodeGenTestCheck(L"constprop\\Saturate_half.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Saturate_float.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Saturate_double.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Cos.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Sin.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Tan.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Acos.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Asin.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Atan.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Hcos.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Hsin.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Htan.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Exp.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Frc.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Log.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Sqrt.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Rsqrt.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Round_ne.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Round_ni.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Round_pi.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Round_z.hlsl");
														
 
															+  // Next group: inputs named after integer bit operations.
														
 
															+  CodeGenTestCheck(L"constprop\\Bfrev.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Countbits.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Firstbitlo.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Firstbithi.hlsl");
														
 
															+
														
 
															+  CodeGenTestCheck(L"constprop\\FMin.hlsl");  // Min/max inputs with F, I and U name prefixes.
														
 
															+  CodeGenTestCheck(L"constprop\\FMax.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\IMin.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\IMax.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\UMin.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\UMax.hlsl");
														
 
															+  // Next group: multiply-add inputs (FMad, Fma, IMad, UMad).
														
 
															+  CodeGenTestCheck(L"constprop\\FMad.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Fma.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\IMad.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\UMad.hlsl");
														
 
															+  // Next group: dot-product inputs (Dot2, Dot3, Dot4).
														
 
															+  CodeGenTestCheck(L"constprop\\Dot2.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Dot3.hlsl");
														
 
															+  CodeGenTestCheck(L"constprop\\Dot4.hlsl");
														
 
															+
														
 
															+  CodeGenTestCheck(L"constprop\\ibfe.ll");  // The last three inputs are .ll files rather than HLSL; ubfe.ll's RUN line runs %opt with -sccp.
														
 
															+  CodeGenTestCheck(L"constprop\\ubfe.ll");
														
 
															+  CodeGenTestCheck(L"constprop\\bfi.ll");
														
 
															+}
														
 
															+
														
 
															 TEST_F(CompilerTest, PreprocessWhenValidThenOK) {
														
 
															   CComPtr<IDxcCompiler> pCompiler;
														
 
															   CComPtr<IDxcOperationResult> pResult;
														
--- a/tools/clang/unittests/HLSL/FileCheckerTest.cpp
+++ b/tools/clang/unittests/HLSL/FileCheckerTest.cpp
@@ -341,9 +341,12 @@ static string trim(string value) {
 
															       for (llvm::StringRef S : splitArgs) {
														
 
															         optionStrings.push_back(
														
 
															             Unicode::UTF8ToUTF16StringOrThrow(trim(S.str()).c_str()));
														
 
															-        options.push_back(optionStrings.back().c_str());
														
 
															       }
														
 
															+      // Add the options outside the above loop in case the vector is resized.
														
 
															+      for (const std::wstring& str : optionStrings)
														
 
															+        options.push_back(str.c_str());
														
 
															+
														
 
															       IFT(pOptimizer->RunOptimizer(pSource, options.data(), options.size(),
														
 
															                                    &pOutputModule, &pOutputText));
														
 
															       StdOut = BlobToUtf8(pOutputText);