Remove the HLSL-specific type promotion helpers from __builtin_hlsl_dot checking

farzonl · farzonl · commit 080b65fcce39 · 2024-02-23T18:53:12.000-05:00
diff --git a/clang/lib/CodeGen/CGBuiltin.cpp b/clang/lib/CodeGen/CGBuiltin.cpp
@@ -17996,8 +17996,10 @@ Value *CodeGenFunction::EmitHLSLBuiltinExpr(unsigned BuiltinID,
     assert(T0->getScalarType() == T1->getScalarType() &&
            "Dot product of vectors need the same element types.");
 
-    auto *VecTy0 = E->getArg(0)->getType()->getAs<VectorType>();
-    auto *VecTy1 = E->getArg(1)->getType()->getAs<VectorType>();
+    [[maybe_unused]] auto *VecTy0 =
+        E->getArg(0)->getType()->getAs<VectorType>();
+    [[maybe_unused]] auto *VecTy1 =
+        E->getArg(1)->getType()->getAs<VectorType>();
     // A HLSLVectorTruncation should have happend
     assert(VecTy0->getNumElements() == VecTy1->getNumElements() &&
            "Dot product requires vectors to be of the same size.");
diff --git a/clang/lib/Headers/hlsl/hlsl_intrinsics.h b/clang/lib/Headers/hlsl/hlsl_intrinsics.h
@@ -182,6 +182,12 @@ double4 cos(double4);
 //===----------------------------------------------------------------------===//
 // dot product builtins
 //===----------------------------------------------------------------------===//
+
+/// \fn K dot(T X, T Y)
+/// \brief Return the dot product (a scalar value) of \a X and \a Y.
+/// \param X The X input value.
+/// \param Y The Y input value.
+
 _HLSL_16BIT_AVAILABILITY(shadermodel, 6.2)
 _HLSL_BUILTIN_ALIAS(__builtin_hlsl_dot)
 half dot(half, half);
diff --git a/clang/lib/Sema/SemaChecking.cpp b/clang/lib/Sema/SemaChecking.cpp
@@ -2962,9 +2962,8 @@ Sema::CheckBuiltinFunctionCall(FunctionDecl *FDecl, unsigned BuiltinID,
   }
   }
 
-  if (getLangOpts().HLSL && CheckHLSLBuiltinFunctionCall(BuiltinID, TheCall)) {
+  if (getLangOpts().HLSL && CheckHLSLBuiltinFunctionCall(BuiltinID, TheCall))
     return ExprError();
-  }
 
   // Since the target specific builtins for each arch overlap, only check those
   // of the arch we are compiling for.
@@ -5166,96 +5165,6 @@ bool Sema::CheckPPCMMAType(QualType Type, SourceLocation TypeLoc) {
   return false;
 }
 
-// Helper function for CheckHLSLBuiltinFunctionCall
-// Note: UsualArithmeticConversions handles the case where at least
-// one arg isn't a bool
-bool PromoteBoolsToInt(Sema *S, CallExpr *TheCall) {
-  unsigned NumArgs = TheCall->getNumArgs();
-
-  for (unsigned i = 0; i < NumArgs; ++i) {
-    ExprResult A = TheCall->getArg(i);
-    if (!A.get()->getType()->isBooleanType())
-      return false;
-  }
-  // if we got here all args are bool
-  for (unsigned i = 0; i < NumArgs; ++i) {
-    ExprResult A = TheCall->getArg(i);
-    ExprResult ResA = S->PerformImplicitConversion(A.get(), S->Context.IntTy,
-                                                   Sema::AA_Converting);
-    if (ResA.isInvalid())
-      return true;
-    TheCall->setArg(i, ResA.get());
-  }
-  return false;
-}
-
-// Helper function for CheckHLSLBuiltinFunctionCall
-// Handles the CK_HLSLVectorTruncation case for builtins
-void PromoteVectorArgTruncation(Sema *S, CallExpr *TheCall) {
-  assert(TheCall->getNumArgs() > 1);
-  ExprResult A = TheCall->getArg(0);
-  ExprResult B = TheCall->getArg(1);
-  QualType ArgTyA = A.get()->getType();
-  QualType ArgTyB = B.get()->getType();
-
-  auto *VecTyA = ArgTyA->getAs<VectorType>();
-  auto *VecTyB = ArgTyB->getAs<VectorType>();
-  if (VecTyA == nullptr && VecTyB == nullptr)
-    return;
-  if (VecTyA == nullptr || VecTyB == nullptr)
-    return;
-  if (VecTyA->getNumElements() == VecTyB->getNumElements())
-    return;
-
-  Expr *LargerArg = B.get();
-  Expr *SmallerArg = A.get();
-  int largerIndex = 1;
-  if (VecTyA->getNumElements() > VecTyB->getNumElements()) {
-    LargerArg = A.get();
-    SmallerArg = B.get();
-    largerIndex = 0;
-  }
-
-  S->Diag(TheCall->getExprLoc(), diag::warn_hlsl_impcast_vector_truncation)
-      << LargerArg->getType() << SmallerArg->getType()
-      << LargerArg->getSourceRange() << SmallerArg->getSourceRange();
-  ExprResult ResLargerArg = S->ImpCastExprToType(
-      LargerArg, SmallerArg->getType(), CK_HLSLVectorTruncation);
-  TheCall->setArg(largerIndex, ResLargerArg.get());
-  return;
-}
-
-// Helper function for CheckHLSLBuiltinFunctionCall
-void CheckVectorFloatPromotion(Sema *S, ExprResult &source, QualType targetTy,
-                               SourceRange targetSrcRange,
-                               SourceLocation BuiltinLoc) {
-  auto *vecTyTarget = source.get()->getType()->getAs<VectorType>();
-  assert(vecTyTarget);
-  QualType vecElemT = vecTyTarget->getElementType();
-  if (!vecElemT->isFloatingType() && targetTy->isFloatingType()) {
-    QualType floatVecTy = S->Context.getVectorType(
-        S->Context.FloatTy, vecTyTarget->getNumElements(), VectorKind::Generic);
-
-    S->Diag(BuiltinLoc, diag::warn_impcast_integer_float_precision)
-        << source.get()->getType() << floatVecTy
-        << source.get()->getSourceRange() << targetSrcRange;
-    source = S->SemaConvertVectorExpr(
-        source.get(), S->Context.CreateTypeSourceInfo(floatVecTy), BuiltinLoc,
-        source.get()->getBeginLoc());
-  }
-}
-
-// Helper function for CheckHLSLBuiltinFunctionCall
-void PromoteVectorArgSplat(Sema *S, ExprResult &source, QualType targetTy) {
-  QualType sourceTy = source.get()->getType();
-  auto *vecTyTarget = targetTy->getAs<VectorType>();
-  QualType vecElemT = vecTyTarget->getElementType();
-  if (vecElemT->isFloatingType() && sourceTy != vecElemT)
-    // if float vec splat wil do an unnecessary cast to double
-    source = S->ImpCastExprToType(source.get(), vecElemT, CK_FloatingCast);
-  source = S->ImpCastExprToType(source.get(), targetTy, CK_VectorSplat);
-}
-
 // Helper function for CheckHLSLBuiltinFunctionCall
 bool CheckVectorElementCallArgs(Sema *S, CallExpr *TheCall) {
   assert(TheCall->getNumArgs() > 1);
@@ -5265,36 +5174,42 @@ bool CheckVectorElementCallArgs(Sema *S, CallExpr *TheCall) {
   QualType ArgTyB = B.get()->getType();
   auto *VecTyA = ArgTyA->getAs<VectorType>();
   auto *VecTyB = ArgTyB->getAs<VectorType>();
-
+  SourceLocation BuiltinLoc = TheCall->getBeginLoc();
   if (VecTyA == nullptr && VecTyB == nullptr)
     return false;
 
   if (VecTyA && VecTyB) {
-    if (VecTyA->getElementType() == VecTyB->getElementType()) {
-      TheCall->setType(VecTyA->getElementType());
-      return false;
+    bool retValue = false;
+    if (VecTyA->getElementType() != VecTyB->getElementType()) {
+      // Note: type promotion is intended to be handled via the intrinsics
+      //  and not the builtin itself.
+      S->Diag(TheCall->getBeginLoc(), diag::err_vec_builtin_incompatible_vector)
+          << TheCall->getDirectCallee()
+          << SourceRange(A.get()->getBeginLoc(), B.get()->getEndLoc());
+      retValue = true;
+    }
+    if (VecTyA->getNumElements() != VecTyB->getNumElements()) {
+      // If we get here, an HLSLVectorTruncation is needed.
+      S->Diag(BuiltinLoc, diag::err_vec_builtin_incompatible_vector)
+          << TheCall->getDirectCallee()
+          << SourceRange(TheCall->getArg(0)->getBeginLoc(),
+                         TheCall->getArg(1)->getEndLoc());
+      retValue = true;
     }
-    // Note: type promotion is intended to be handeled via the intrinsics
-    //  and not the builtin itself.
-    S->Diag(TheCall->getBeginLoc(), diag::err_vec_builtin_incompatible_vector)
-        << TheCall->getDirectCallee()
-        << SourceRange(A.get()->getBeginLoc(), B.get()->getEndLoc());
-    return true;
-  }
 
-  if (VecTyB) {
-    CheckVectorFloatPromotion(S, B, ArgTyA, A.get()->getSourceRange(),
-                              TheCall->getBeginLoc());
-    PromoteVectorArgSplat(S, A, B.get()->getType());
-  }
-  if (VecTyA) {
-    CheckVectorFloatPromotion(S, A, ArgTyB, B.get()->getSourceRange(),
-                              TheCall->getBeginLoc());
-    PromoteVectorArgSplat(S, B, A.get()->getType());
+    if (retValue)
+      TheCall->setType(VecTyA->getElementType());
+
+    return retValue;
   }
-  TheCall->setArg(0, A.get());
-  TheCall->setArg(1, B.get());
-  return false;
+
+  // Note: if we get here one of the args is a scalar which
+  // requires a VectorSplat on Arg0 or Arg1
+  S->Diag(BuiltinLoc, diag::err_vec_builtin_non_vector)
+      << TheCall->getDirectCallee()
+      << SourceRange(TheCall->getArg(0)->getBeginLoc(),
+                     TheCall->getArg(1)->getEndLoc());
+  return true;
 }
 
 // Note: returning true in this case results in CheckBuiltinFunctionCall
@@ -5304,11 +5219,8 @@ bool Sema::CheckHLSLBuiltinFunctionCall(unsigned BuiltinID, CallExpr *TheCall) {
   case Builtin::BI__builtin_hlsl_dot: {
     if (checkArgCount(*this, TheCall, 2))
       return true;
-    if (PromoteBoolsToInt(this, TheCall))
-      return true;
     if (CheckVectorElementCallArgs(this, TheCall))
       return true;
-    PromoteVectorArgTruncation(this, TheCall);
     if (SemaBuiltinVectorToScalarMath(TheCall))
       return true;
     break;
@@ -19759,24 +19671,22 @@ bool Sema::PrepareBuiltinElementwiseMathOneArgCall(CallExpr *TheCall) {
 
 bool Sema::SemaBuiltinElementwiseMath(CallExpr *TheCall) {
   QualType Res;
-  bool result = SemaBuiltinVectorMath(TheCall, Res);
-  if (result)
+  if (SemaBuiltinVectorMath(TheCall, Res))
     return true;
   TheCall->setType(Res);
   return false;
 }
 
 bool Sema::SemaBuiltinVectorToScalarMath(CallExpr *TheCall) {
   QualType Res;
-  bool result = SemaBuiltinVectorMath(TheCall, Res);
-  if (result)
+  if (SemaBuiltinVectorMath(TheCall, Res))
     return true;
 
-  if (auto *VecTy0 = Res->getAs<VectorType>()) {
+  if (auto *VecTy0 = Res->getAs<VectorType>())
     TheCall->setType(VecTy0->getElementType());
-  } else {
+  else
     TheCall->setType(Res);
-  }
+
   return false;
 }
 
diff --git a/clang/test/CodeGenHLSL/builtins/dot-builtin.hlsl b/clang/test/CodeGenHLSL/builtins/dot-builtin.hlsl
@@ -1,44 +1,6 @@
-// RUN: %clang_cc1 -std=hlsl2021 -finclude-default-header -x hlsl -triple \
-// RUN:   dxil-pc-shadermodel6.3-library %s -fnative-half-type \
-// RUN:   -emit-llvm -disable-llvm-passes -O3 -o - | FileCheck %s \ 
-// RUN:   --check-prefixes=CHECK
-
-// CHECK:  %dx.dot = call float @llvm.dx.dot.v2f32(<2 x float> %splat.splat, <2 x float> %1)
-// CHECK: ret float %dx.dot
-float test_builtin_dot_float2_splat ( float p0, float2 p1 ) {
-  return __builtin_hlsl_dot( p0, p1 );
-}
-
-// CHECK:  %dx.dot = call float @llvm.dx.dot.v3f32(<3 x float> %splat.splat, <3 x float> %1)
-// CHECK: ret float %dx.dot
-float test_builtin_dot_float3_splat ( float p0, float3 p1 ) {
-  return __builtin_hlsl_dot( p0, p1 );
-}
-
-// CHECK:  %dx.dot = call float @llvm.dx.dot.v4f32(<4 x float> %splat.splat, <4 x float> %1)
-// CHECK: ret float %dx.dot
-float test_builtin_dot_float4_splat ( float p0, float4 p1 ) {
-  return __builtin_hlsl_dot( p0, p1 );
-}
-
-// CHECK: %conv = sitofp i32 %1 to float
-// CHECK: %splat.splatinsert = insertelement <2 x float> poison, float %conv, i64 0
-// CHECK: %splat.splat = shufflevector <2 x float> %splat.splatinsert, <2 x float> poison, <2 x i32> zeroinitializer
-// CHECK: %dx.dot = call float @llvm.dx.dot.v2f32(<2 x float> %0, <2 x float> %splat.splat)
-// CHECK: ret float %dx.dot
-float test_dot_float2_int_splat ( float2 p0, int p1 ) {
-  return __builtin_hlsl_dot ( p0, p1 );
-}
-
-// CHECK: %conv = sitofp i32 %1 to float
-// CHECK: %splat.splatinsert = insertelement <3 x float> poison, float %conv, i64 0
-// CHECK: %splat.splat = shufflevector <3 x float> %splat.splatinsert, <3 x float> poison, <3 x i32> zeroinitializer
-// CHECK: %dx.dot = call float @llvm.dx.dot.v3f32(<3 x float> %0, <3 x float> %splat.splat)
-// CHECK: ret float %dx.dot
-float test_dot_float3_int_splat ( float3 p0, int p1 ) {
-  return __builtin_hlsl_dot ( p0, p1 );
-}
+// RUN: %clang_cc1 -finclude-default-header -x hlsl -triple dxil-pc-shadermodel6.3-library %s -fnative-half-type -emit-llvm -disable-llvm-passes -o - | FileCheck %s
 
+// CHECK-LABEL: builtin_bool_to_float_type_promotion
 // CHECK: %conv1 = uitofp i1 %tobool to double
 // CHECK: %dx.dot = fmul double %conv, %conv1
 // CHECK: %conv2 = fptrunc double %dx.dot to float
@@ -47,6 +9,7 @@ float builtin_bool_to_float_type_promotion ( float p0, bool p1 ) {
   return __builtin_hlsl_dot ( p0, p1 );
 }
 
+// CHECK-LABEL: builtin_bool_to_float_arg1_type_promotion
 // CHECK: %conv = uitofp i1 %tobool to double
 // CHECK: %conv1 = fpext float %1 to double
 // CHECK: %dx.dot = fmul double %conv, %conv1
@@ -56,28 +19,12 @@ float builtin_bool_to_float_arg1_type_promotion ( bool p0, float p1 ) {
   return __builtin_hlsl_dot ( p0, p1 );
 }
 
-// CHECK: %conv = zext i1 %tobool to i32
-// CHECK: %conv3 = zext i1 %tobool2 to i32
-// CHECK: %dx.dot = mul i32 %conv, %conv3
-// CHECK: ret i32 %dx.dot
-int test_builtin_dot_bool_type_promotion ( bool p0, bool p1 ) {
-  return __builtin_hlsl_dot ( p0, p1 );
-}
-
+// CHECK-LABEL: builtin_dot_int_to_float_promotion
 // CHECK: %conv = fpext float %0 to double
 // CHECK: %conv1 = sitofp i32 %1 to double
 // CHECK: dx.dot = fmul double %conv, %conv1
 // CHECK: %conv2 = fptrunc double %dx.dot to float
 // CHECK: ret float %conv2
-float test_builtin_dot_int_to_float_promotion ( float p0, int p1 ) {
-  return __builtin_hlsl_dot ( p0, p1 );
-}
-
-
-// CHECK: %conv = sitofp <2 x i32> %0 to <2 x float>
-// CHECK: %splat.splat = shufflevector <2 x float> %splat.splatinsert, <2 x float> poison, <2 x i32> zeroinitializer
-// CHECK: %dx.dot = call float @llvm.dx.dot.v2f32(<2 x float> %conv, <2 x float> %splat.splat)
-// CHECK: ret float %dx.dot
-float test_builtin_dot_int_vect_to_float_vec_promotion ( int2 p0, float p1 ) {
+float builtin_dot_int_to_float_promotion ( float p0, int p1 ) {
   return __builtin_hlsl_dot ( p0, p1 );
 }
diff --git a/clang/test/CodeGenHLSL/builtins/dot.hlsl b/clang/test/CodeGenHLSL/builtins/dot.hlsl
@@ -1,8 +1,8 @@
-// RUN: %clang_cc1 -std=hlsl2021 -finclude-default-header -x hlsl -triple \
+// RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \
 // RUN:   dxil-pc-shadermodel6.3-library %s -fnative-half-type \
-// RUN:   -emit-llvm -disable-llvm-passes -O3 -o - | FileCheck %s \ 
+// RUN:   -emit-llvm -disable-llvm-passes -o - | FileCheck %s \ 
 // RUN:   --check-prefixes=CHECK,NATIVE_HALF
-// RUN: %clang_cc1 -std=hlsl2021 -finclude-default-header -x hlsl -triple \
+// RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \
 // RUN:   dxil-pc-shadermodel6.3-library %s -emit-llvm -disable-llvm-passes \
 // RUN:   -o - | FileCheck %s --check-prefixes=CHECK,NO_HALF
 
diff --git a/clang/test/SemaHLSL/BuiltIns/dot-errors.hlsl b/clang/test/SemaHLSL/BuiltIns/dot-errors.hlsl
@@ -1,6 +1,4 @@
-// RUN: %clang_cc1 -std=hlsl2021 -finclude-default-header -x hlsl -triple \
-// RUN:   dxil-pc-shadermodel6.3-library %s -fnative-half-type -emit-llvm \
-// RUN:   -disable-llvm-passes -verify -verify-ignore-unexpected
+// RUN: %clang_cc1 -finclude-default-header -triple dxil-pc-shadermodel6.6-library %s -fnative-half-type -emit-llvm -disable-llvm-passes -verify -verify-ignore-unexpected
 
 float test_no_second_arg ( float2 p0) {
   return __builtin_hlsl_dot ( p0 );
@@ -25,7 +23,7 @@ float test_dot_vector_size_mismatch ( float3 p0, float2 p1 ) {
 
 float test_dot_builtin_vector_size_mismatch ( float3 p0, float2 p1 ) {
   return __builtin_hlsl_dot ( p0, p1 );
-  // expected-warning@-1 {{implicit conversion truncates vector: 'float3' (aka 'vector<float, 3>') to 'float2' (aka 'vector<float, 2>')}}
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must have the same type}}
 }
 
 float test_dot_scalar_mismatch ( float p0, int p1 ) {
@@ -75,3 +73,38 @@ int64_t test_builtin_dot_vec_int16_to_int64_promotion( int64_t2 p0, int16_t2 p1
   // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must have the same type}}
 }
 #endif
+
+float test_builtin_dot_float2_splat ( float p0, float2 p1 ) {
+  return __builtin_hlsl_dot( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+float test_builtin_dot_float3_splat ( float p0, float3 p1 ) {
+  return __builtin_hlsl_dot( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+float test_builtin_dot_float4_splat ( float p0, float4 p1 ) {
+  return __builtin_hlsl_dot( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+float test_dot_float2_int_splat ( float2 p0, int p1 ) {
+  return __builtin_hlsl_dot ( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+float test_dot_float3_int_splat ( float3 p0, int p1 ) {
+  return __builtin_hlsl_dot ( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+float test_builtin_dot_int_vect_to_float_vec_promotion ( int2 p0, float p1 ) {
+  return __builtin_hlsl_dot ( p0, p1 );
+  // expected-error@-1 {{first two arguments to '__builtin_hlsl_dot' must be vectors}}
+}
+
+int test_builtin_dot_bool_type_promotion ( bool p0, bool p1 ) {
+  return __builtin_hlsl_dot ( p0, p1 );
+  // expected-error@-1 {{1st argument must be a vector, integer or floating point type (was 'bool')}}
+}