From 3884939853312782e5252084f28cd3f806d705fe Mon Sep 17 00:00:00 2001
From: Chengcheng Jin <chengcheng.jin@intel.com>
Date: Tue, 12 Nov 2024 10:06:06 -0800
Subject: [PATCH] Add support for allow-precision-loss in decimal operations
 (#10383)

Summary:
Each of the decimal operation functions is registered as two functions such as `add_deny_precision_loss` and `add`.
When allowing precision loss, establishing the result type of an arithmetic operation happens according to Hive behavior and SQL ANSI 2011 specification, i.e. rounding the decimal part of the result if an exact representation is not possible. Otherwise, NULL is returned in those cases, as previously.
When precision loss is not allowed, the decimal part of the result is not rounded.

For example,
  | decimal(38, 7) + decimal(10, 0) result type | 1.1232154   + 1| decimal(38, 18) * decimal(38, 18)| 0.1234567891011 * 1234.1
-- | -- | -- | -- | --
allow   precision loss | decimal(38, 6) | 2.123215 | decimal(38, 6) | 152.358023
deny precision   loss | decimal(38, 7) | 2.1232154 | decimal(38, 36) | NULL

```
spark-sql (default)> set spark.sql.decimalOperations.allowPrecisionLoss=true;

spark-sql (default)> select cast(0.1234567891011 as decimal(38, 18)) * cast(1234.1 as decimal(38, 18));
152.358023

spark-sql (default)> set spark.sql.decimalOperations.allowPrecisionLoss=false;

spark-sql (default)> select cast(0.1234567891011 as decimal(38, 18)) * cast(1234.1 as decimal(38, 18));
NULL
```

Spark implementation: https://github.com/apache/spark/blob/branch-3.5/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/arithmetic.scala#L814

Pull Request resolved: https://github.com/facebookincubator/velox/pull/10383

Reviewed By: pedroerp

Differential Revision: D65612198

Pulled By: kevinwilfong

fbshipit-source-id: 4910aaeb0e375dbe8817c5f3fb41185c67c6dd5b
---
 velox/docs/functions/spark/decimal.rst        |  90 ++++++-
 .../functions/sparksql/DecimalArithmetic.cpp  | 229 +++++++++++++-----
 velox/functions/sparksql/DecimalUtil.h        |  10 +
 .../sparksql/tests/DecimalArithmeticTest.cpp  |  59 +++++
 .../sparksql/tests/DecimalUtilTest.cpp        |  12 +
 5 files changed, 332 insertions(+), 68 deletions(-)

diff --git a/velox/docs/functions/spark/decimal.rst b/velox/docs/functions/spark/decimal.rst
index 19eee325f4b3..e6901166c627 100644
--- a/velox/docs/functions/spark/decimal.rst
+++ b/velox/docs/functions/spark/decimal.rst
@@ -2,15 +2,46 @@
 Decimal Operators
 =================
 
-When calculating the result precision and scale of arithmetic operators,
-the formulas follow Hive which is based on the SQL standard and MS SQL:
+The computation of the result precision and scale of arithmetic operators consists of two stages.
+The first stage computes precision and scale using formulas based on the SQL standard and Hive when allow-precision-loss is true.
+The result may exceed the maximum allowed precision of 38.
+
+The second stage caps precision at 38 and either reduces the scale or keeps it, depending on the allow-precision-loss flag.
+
+For example, addition of decimal(38, 7) and decimal(10, 0) requires precision of 39 and scale of 7.
+Since precision exceeds 38 it needs to be capped. When allow-precision-loss is true, precision is capped at 38 and scale is reduced by 1 to 6.
+When allow-precision-loss is false, precision is capped at 38 as well, but scale is kept at 7.
+With allow-precision-loss all additions will succeed, but accuracy (number of digits after period) of some operations will be reduced.
+Without allow-precision-loss, some additions will return NULL.
+
+For example,
+
+The following queries keep accuracy or return NULL when allow-precision-loss is false:
+
+::
+
+    select cast('1.1232154' as decimal(38, 7)) + cast('1' as decimal(10, 0)); -- 2.1232154
+    select cast('9999999999999999999999999999999.2345678' as decimal(38, 7)) + cast('1' as decimal(10, 0)); -- NULL
+
+These same operations succeed when allow-precision-loss is true:
+
+::
+
+    select cast('1.1232154' as decimal(38, 7)) + cast('1' as decimal(10, 0)); -- 2.123215, lost the last digit
+    select cast('9999999999999999999999999999999.2345678' as decimal(38, 7)) + cast('1' as decimal(10, 0)); -- 10000000000000000000000000000000.234568
+
+Decimal Precision and Scale Computation Formulas
+------------------------------------------------
+
+The HiveQL behavior:
 
 https://cwiki.apache.org/confluence/download/attachments/27362075/Hive_Decimal_Precision_Scale_Support.pdf
 
-https://msdn.microsoft.com/en-us/library/ms190476.aspx
+Additionally, the computation of decimal division adapts to the allow-precision-loss flag,
+while the decimal addition, subtraction, and multiplication do not.
 
 Addition and Subtraction
-------------------------
+~~~~~~~~~~~~~~~~~~~~~~~~
 
 ::
 
@@ -18,7 +49,7 @@ Addition and Subtraction
 	s = max(s1, s2)
 
 Multiplication
---------------
+~~~~~~~~~~~~~~
 
 ::
 
@@ -26,25 +57,60 @@ Multiplication
 	s = s1 + s2
 
 Division
---------
+~~~~~~~~
+When allow-precision-loss is true:
 
 ::
 
     p = p1 - s1 + s2 + max(6, s1 + p2 + 1)
     s = max(6, s1 + p2 + 1)
 
-For above arithmetic operators, when the precision of result exceeds 38,
-caps p at 38 and reduces the scale, in order to prevent the truncation of
-the integer part of the decimals. Below formula illustrates how the result
-precision and scale are adjusted.
+When allow-precision-loss is false:
+
+::
+
+    wholeDigits = min(38, p1 - s1 + s2)
+    fractionalDigits = min(38, max(6, s1 + p2 + 1))
+    p = wholeDigits + fractionalDigits
+    s = fractionalDigits
+
+Decimal Precision and Scale Adjustment
+--------------------------------------
+
+When allow-precision-loss is true, rounds the decimal part of the result if an exact representation is not possible.
+Otherwise, returns NULL.
+Notice: some operations succeed if precision loss is allowed and return NULL if not.
+
+For example,
+
+::
+
+    select cast(0.1234567891011 as decimal(38, 18)) * cast(1234.1 as decimal(38, 18));
+    -- 152.358023 if allow-precision-loss, NULL otherwise.
+
+Below formula illustrates how the result precision and scale are adjusted.
 
 ::
 
     precision = 38
     scale = max(38 - (p - s), min(s, 6))
 
-Users experience runtime errors when the actual result cannot be represented
-with the calculated decimal type.
+When precision loss is not allowed, caps p at 38, and keeps scale as is.
+The below formula shows how the precision and scale are adjusted for decimal addition, subtraction, and multiplication.
+
+::
+
+    precision = 38
+    scale = min(38, s)
+
+When precision loss is not allowed and wholeDigits + fractionalDigits exceeds 38, decimal division uses a different formula:
+
+::
+
+    precision = 38
+    scale = fractionalDigits - (wholeDigits + fractionalDigits - 38) / 2 - 1
+
+Returns NULL when the actual result cannot be represented with the calculated decimal type.
 
 Decimal Functions
 -----------------
diff --git a/velox/functions/sparksql/DecimalArithmetic.cpp b/velox/functions/sparksql/DecimalArithmetic.cpp
index 61599bce10ea..7f5b48ea7740 100644
--- a/velox/functions/sparksql/DecimalArithmetic.cpp
+++ b/velox/functions/sparksql/DecimalArithmetic.cpp
@@ -21,15 +21,18 @@
 namespace facebook::velox::functions::sparksql {
 namespace {
 
+static constexpr const char* kDenyPrecisionLoss = "_deny_precision_loss";
+
 struct DecimalAddSubtractBase {
  protected:
+  template <bool allowPrecisionLoss>
   void initializeBase(const std::vector<TypePtr>& inputTypes) {
     auto [aPrecision, aScale] = getDecimalPrecisionScale(*inputTypes[0]);
     auto [bPrecision, bScale] = getDecimalPrecisionScale(*inputTypes[1]);
     aScale_ = aScale;
     bScale_ = bScale;
-    auto [rPrecision, rScale] =
-        computeResultPrecisionScale(aPrecision, aScale_, bPrecision, bScale_);
+    auto [rPrecision, rScale] = computeResultPrecisionScale<allowPrecisionLoss>(
+        aPrecision, aScale_, bPrecision, bScale_);
     rPrecision_ = rPrecision;
     rScale_ = rScale;
     aRescale_ = computeRescaleFactor(aScale_, bScale_);
@@ -252,11 +255,13 @@ struct DecimalAddSubtractBase {
     }
   }
 
-  // Computes the result precision and scale for decimal add and subtract
-  // operations following Hive's formulas.
-  // If result is representable with long decimal, the result
-  // scale is the maximum of 'aScale' and 'bScale'. If not, reduces result scale
-  // and caps the result precision at 38.
+  // When `allowPrecisionLoss` is true, computes the result precision and scale
+  // for decimal add and subtract operations following Hive's formulas. If
+  // result is representable with long decimal, the result scale is the maximum
+  // of 'aScale' and 'bScale'. If not, reduces result scale and caps the result
+  // precision at 38.
+  // When `allowPrecisionLoss` is false, caps p and s at 38.
+  template <bool allowPrecisionLoss>
   static std::pair<uint8_t, uint8_t> computeResultPrecisionScale(
       uint8_t aPrecision,
       uint8_t aScale,
@@ -265,7 +270,11 @@ struct DecimalAddSubtractBase {
     auto precision = std::max(aPrecision - aScale, bPrecision - bScale) +
         std::max(aScale, bScale) + 1;
     auto scale = std::max(aScale, bScale);
-    return sparksql::DecimalUtil::adjustPrecisionScale(precision, scale);
+    if constexpr (allowPrecisionLoss) {
+      return sparksql::DecimalUtil::adjustPrecisionScale(precision, scale);
+    } else {
+      return sparksql::DecimalUtil::bounded(precision, scale);
+    }
   }
 
   static uint8_t computeRescaleFactor(uint8_t fromScale, uint8_t toScale) {
@@ -280,7 +289,7 @@ struct DecimalAddSubtractBase {
   uint8_t rScale_;
 };
 
-template <typename TExec>
+template <typename TExec, bool allowPrecisionLoss>
 struct DecimalAddFunction : DecimalAddSubtractBase {
   VELOX_DEFINE_FUNCTION_TYPES(TExec);
 
@@ -290,7 +299,7 @@ struct DecimalAddFunction : DecimalAddSubtractBase {
       const core::QueryConfig& /*config*/,
       A* /*a*/,
       B* /*b*/) {
-    initializeBase(inputTypes);
+    initializeBase<allowPrecisionLoss>(inputTypes);
   }
 
   template <typename R, typename A, typename B>
@@ -299,7 +308,7 @@ struct DecimalAddFunction : DecimalAddSubtractBase {
   }
 };
 
-template <typename TExec>
+template <typename TExec, bool allowPrecisionLoss>
 struct DecimalSubtractFunction : DecimalAddSubtractBase {
   VELOX_DEFINE_FUNCTION_TYPES(TExec);
 
@@ -309,7 +318,7 @@ struct DecimalSubtractFunction : DecimalAddSubtractBase {
       const core::QueryConfig& /*config*/,
       A* /*a*/,
       B* /*b*/) {
-    initializeBase(inputTypes);
+    initializeBase<allowPrecisionLoss>(inputTypes);
   }
 
   template <typename R, typename A, typename B>
@@ -318,7 +327,7 @@ struct DecimalSubtractFunction : DecimalAddSubtractBase {
   }
 };
 
-template <typename TExec>
+template <typename TExec, bool allowPrecisionLoss>
 struct DecimalMultiplyFunction {
   VELOX_DEFINE_FUNCTION_TYPES(TExec);
 
@@ -330,10 +339,16 @@ struct DecimalMultiplyFunction {
       B* /*b*/) {
     auto [aPrecision, aScale] = getDecimalPrecisionScale(*inputTypes[0]);
     auto [bPrecision, bScale] = getDecimalPrecisionScale(*inputTypes[1]);
-    auto [rPrecision, rScale] = DecimalUtil::adjustPrecisionScale(
-        aPrecision + bPrecision + 1, aScale + bScale);
-    rPrecision_ = rPrecision;
-    deltaScale_ = aScale + bScale - rScale;
+    std::pair<uint8_t, uint8_t> rPrecisionScale;
+    if constexpr (allowPrecisionLoss) {
+      rPrecisionScale = DecimalUtil::adjustPrecisionScale(
+          aPrecision + bPrecision + 1, aScale + bScale);
+    } else {
+      rPrecisionScale =
+          DecimalUtil::bounded(aPrecision + bPrecision + 1, aScale + bScale);
+    }
+    rPrecision_ = rPrecisionScale.first;
+    deltaScale_ = aScale + bScale - rPrecisionScale.second;
   }
 
   template <typename R, typename A, typename B>
@@ -426,7 +441,7 @@ struct DecimalMultiplyFunction {
   int32_t deltaScale_;
 };
 
-template <typename TExec>
+template <typename TExec, bool allowPrecisionLoss>
 struct DecimalDivideFunction {
   VELOX_DEFINE_FUNCTION_TYPES(TExec);
 
@@ -453,14 +468,30 @@ struct DecimalDivideFunction {
   }
 
  private:
+  // When allowing precision loss, computes the result precision and scale
+  // following Hive's formulas. When denying precision loss, calculates the
+  // number of whole digits and fraction digits. If the total number of digits
+  // exceeds 38, reduces both the number of fraction digits and whole digits to
+  // fit within this limit.
   static std::pair<uint8_t, uint8_t> computeResultPrecisionScale(
       uint8_t aPrecision,
       uint8_t aScale,
       uint8_t bPrecision,
       uint8_t bScale) {
-    auto scale = std::max(6, aScale + bPrecision + 1);
-    auto precision = aPrecision - aScale + bScale + scale;
-    return DecimalUtil::adjustPrecisionScale(precision, scale);
+    if constexpr (allowPrecisionLoss) {
+      auto scale = std::max(6, aScale + bPrecision + 1);
+      auto precision = aPrecision - aScale + bScale + scale;
+      return DecimalUtil::adjustPrecisionScale(precision, scale);
+    } else {
+      auto wholeDigits = std::min(38, aPrecision - aScale + bScale);
+      auto fractionDigits = std::min(38, std::max(6, aScale + bPrecision + 1));
+      auto diff = (wholeDigits + fractionDigits) - 38;
+      if (diff > 0) {
+        fractionDigits -= diff / 2 + 1;
+        wholeDigits = 38 - fractionDigits;
+      }
+      return DecimalUtil::bounded(wholeDigits + fractionDigits, fractionDigits);
+    }
   }
 
   uint8_t aRescale_;
@@ -507,16 +538,24 @@ void registerDecimalBinary(
       ShortDecimal<P2, S2>>({name}, constraints);
 }
 
+// Used in function registration to generate the string to cap value at 38.
+std::string bounded(const std::string& value) {
+  return fmt::format("({}) <= 38 ? ({}) : 38", value, value);
+}
+
 std::vector<exec::SignatureVariable> makeConstraints(
     const std::string& rPrecision,
-    const std::string& rScale) {
-  std::string finalScale = fmt::format(
-      "({}) <= 38 ? ({}) : max(({}) - ({}) + 38, min(({}), 6))",
-      rPrecision,
-      rScale,
-      rScale,
-      rPrecision,
-      rScale);
+    const std::string& rScale,
+    bool allowPrecisionLoss) {
+  std::string finalScale = allowPrecisionLoss
+      ? fmt::format(
+            "({}) <= 38 ? ({}) : max(({}) - ({}) + 38, min(({}), 6))",
+            rPrecision,
+            rScale,
+            rScale,
+            rPrecision,
+            rScale)
+      : bounded(rScale);
   return {
       exec::SignatureVariable(
           P3::name(),
@@ -527,8 +566,7 @@ std::vector<exec::SignatureVariable> makeConstraints(
           S3::name(), finalScale, exec::ParameterType::kIntegerParameter)};
 }
 
-template <template <class> typename Func>
-void registerDecimalAddSubtract(const std::string& name) {
+std::pair<std::string, std::string> getAddSubtractResultPrecisionScale() {
   std::string rPrecision = fmt::format(
       "max({a_precision} - {a_scale}, {b_precision} - {b_scale}) + max({a_scale}, {b_scale}) + 1",
       fmt::arg("a_precision", P1::name()),
@@ -539,33 +577,67 @@ void registerDecimalAddSubtract(const std::string& name) {
       "max({a_scale}, {b_scale})",
       fmt::arg("a_scale", S1::name()),
       fmt::arg("b_scale", S2::name()));
-  registerDecimalBinary<Func>(name, makeConstraints(rPrecision, rScale));
+  return {rPrecision, rScale};
 }
 
-} // namespace
+template <typename TExec>
+using AddFunctionAllowPrecisionLoss = DecimalAddFunction<TExec, true>;
 
-void registerDecimalAdd(const std::string& prefix) {
-  registerDecimalAddSubtract<DecimalAddFunction>(prefix + "add");
-}
+template <typename TExec>
+using AddFunctionDenyPrecisionLoss = DecimalAddFunction<TExec, false>;
 
-void registerDecimalSubtract(const std::string& prefix) {
-  registerDecimalAddSubtract<DecimalSubtractFunction>(prefix + "subtract");
-}
+template <typename TExec>
+using SubtractFunctionAllowPrecisionLoss = DecimalSubtractFunction<TExec, true>;
 
-void registerDecimalMultiply(const std::string& prefix) {
-  std::string rPrecision = fmt::format(
-      "{a_precision} + {b_precision} + 1",
+template <typename TExec>
+using SubtractFunctionDenyPrecisionLoss = DecimalSubtractFunction<TExec, false>;
+
+template <typename TExec>
+using MultiplyFunctionAllowPrecisionLoss = DecimalMultiplyFunction<TExec, true>;
+
+template <typename TExec>
+using MultiplyFunctionDenyPrecisionLoss = DecimalMultiplyFunction<TExec, false>;
+
+template <typename TExec>
+using DivideFunctionAllowPrecisionLoss = DecimalDivideFunction<TExec, true>;
+
+template <typename TExec>
+using DivideFunctionDenyPrecisionLoss = DecimalDivideFunction<TExec, false>;
+
+std::vector<exec::SignatureVariable> getDivideConstraintsDenyPrecisionLoss() {
+  std::string wholeDigits = fmt::format(
+      "min(38, {a_precision} - {a_scale} + {b_scale})",
       fmt::arg("a_precision", P1::name()),
-      fmt::arg("b_precision", P2::name()));
-  std::string rScale = fmt::format(
-      "{a_scale} + {b_scale}",
       fmt::arg("a_scale", S1::name()),
       fmt::arg("b_scale", S2::name()));
-  registerDecimalBinary<DecimalMultiplyFunction>(
-      prefix + "multiply", makeConstraints(rPrecision, rScale));
+  std::string fractionDigits = fmt::format(
+      "min(38, max(6, {a_scale} + {b_precision} + 1))",
+      fmt::arg("a_scale", S1::name()),
+      fmt::arg("b_precision", P2::name()));
+  std::string diff = wholeDigits + " + " + fractionDigits + " - 38";
+  std::string newFractionDigits =
+      fmt::format("({}) - ({}) / 2 - 1", fractionDigits, diff);
+  std::string newWholeDigits = fmt::format("38 - ({})", newFractionDigits);
+  return {
+      exec::SignatureVariable(
+          P3::name(),
+          fmt::format(
+              "({}) > 0 ? ({}) : ({})",
+              diff,
+              bounded(newWholeDigits + " + " + newFractionDigits),
+              bounded(wholeDigits + " + " + fractionDigits)),
+          exec::ParameterType::kIntegerParameter),
+      exec::SignatureVariable(
+          S3::name(),
+          fmt::format(
+              "({}) > 0 ? ({}) : ({})",
+              diff,
+              bounded(newFractionDigits),
+              bounded(fractionDigits)),
+          exec::ParameterType::kIntegerParameter)};
 }
 
-std::vector<exec::SignatureVariable> getDivideConstraints() {
+std::vector<exec::SignatureVariable> getDivideConstraintsAllowPrecisionLoss() {
   std::string rPrecision = fmt::format(
       "{a_precision} - {a_scale} + {b_scale} + max(6, {a_scale} + {b_precision} + 1)",
       fmt::arg("a_precision", P1::name()),
@@ -576,25 +648,70 @@ std::vector<exec::SignatureVariable> getDivideConstraints() {
       "max(6, {a_scale} + {b_precision} + 1)",
       fmt::arg("a_scale", S1::name()),
       fmt::arg("b_precision", P2::name()));
-  return makeConstraints(rPrecision, rScale);
+  return makeConstraints(rPrecision, rScale, true);
 }
 
-void registerDecimalDivide(const std::string& prefix) {
-  std::vector<exec::SignatureVariable> constraints = getDivideConstraints();
-  registerDecimalBinary<DecimalDivideFunction>(prefix + "divide", constraints);
+template <template <class> typename Func>
+void registerDecimalDivide(
+    const std::string& functionName,
+    std::vector<exec::SignatureVariable> constraints) {
+  registerDecimalBinary<Func>(functionName, constraints);
 
   // (short, long) -> short
   registerFunction<
-      DecimalDivideFunction,
+      Func,
       ShortDecimal<P3, S3>,
       ShortDecimal<P1, S1>,
-      LongDecimal<P2, S2>>({prefix + "divide"}, constraints);
+      LongDecimal<P2, S2>>({functionName}, constraints);
 
   // (long, short) -> short
   registerFunction<
-      DecimalDivideFunction,
+      Func,
       ShortDecimal<P3, S3>,
       LongDecimal<P1, S1>,
-      ShortDecimal<P2, S2>>({prefix + "divide"}, constraints);
+      ShortDecimal<P2, S2>>({functionName}, constraints);
+}
+} // namespace
+
+void registerDecimalAdd(const std::string& prefix) {
+  auto [rPrecision, rScale] = getAddSubtractResultPrecisionScale();
+  registerDecimalBinary<AddFunctionAllowPrecisionLoss>(
+      prefix + "add", makeConstraints(rPrecision, rScale, true));
+  registerDecimalBinary<AddFunctionDenyPrecisionLoss>(
+      prefix + "add" + kDenyPrecisionLoss,
+      makeConstraints(rPrecision, rScale, false));
+}
+
+void registerDecimalSubtract(const std::string& prefix) {
+  auto [rPrecision, rScale] = getAddSubtractResultPrecisionScale();
+  registerDecimalBinary<SubtractFunctionAllowPrecisionLoss>(
+      prefix + "subtract", makeConstraints(rPrecision, rScale, true));
+  registerDecimalBinary<SubtractFunctionDenyPrecisionLoss>(
+      prefix + "subtract" + kDenyPrecisionLoss,
+      makeConstraints(rPrecision, rScale, false));
+}
+
+void registerDecimalMultiply(const std::string& prefix) {
+  std::string rPrecision = fmt::format(
+      "{a_precision} + {b_precision} + 1",
+      fmt::arg("a_precision", P1::name()),
+      fmt::arg("b_precision", P2::name()));
+  std::string rScale = fmt::format(
+      "{a_scale} + {b_scale}",
+      fmt::arg("a_scale", S1::name()),
+      fmt::arg("b_scale", S2::name()));
+  registerDecimalBinary<MultiplyFunctionAllowPrecisionLoss>(
+      prefix + "multiply", makeConstraints(rPrecision, rScale, true));
+  registerDecimalBinary<MultiplyFunctionDenyPrecisionLoss>(
+      prefix + "multiply" + kDenyPrecisionLoss,
+      makeConstraints(rPrecision, rScale, false));
+}
+
+void registerDecimalDivide(const std::string& prefix) {
+  registerDecimalDivide<DivideFunctionAllowPrecisionLoss>(
+      prefix + "divide", getDivideConstraintsAllowPrecisionLoss());
+  registerDecimalDivide<DivideFunctionDenyPrecisionLoss>(
+      prefix + "divide" + kDenyPrecisionLoss,
+      getDivideConstraintsDenyPrecisionLoss());
 }
 } // namespace facebook::velox::functions::sparksql
diff --git a/velox/functions/sparksql/DecimalUtil.h b/velox/functions/sparksql/DecimalUtil.h
index fbe5da77809e..28495789dc33 100644
--- a/velox/functions/sparksql/DecimalUtil.h
+++ b/velox/functions/sparksql/DecimalUtil.h
@@ -211,6 +211,16 @@ class DecimalUtil {
     }
   }
 
+  /// This method is used when the function is registered with
+  /// ``allowPrecisionLoss`` being false. Caps precision and scale at 38.
+  static std::pair<uint8_t, uint8_t> bounded(
+      uint8_t rPrecision,
+      uint8_t rScale) {
+    return {
+        std::min(rPrecision, DecimalType<TypeKind::HUGEINT>::kMaxPrecision),
+        std::min(rScale, DecimalType<TypeKind::HUGEINT>::kMaxPrecision)};
+  }
+
  private:
   /// Maintains the max bits that need to be increased for rescaling a value by
   /// certain scale. The calculation relies on the following formula:
diff --git a/velox/functions/sparksql/tests/DecimalArithmeticTest.cpp b/velox/functions/sparksql/tests/DecimalArithmeticTest.cpp
index a80baacf78dc..98f16fa774cc 100644
--- a/velox/functions/sparksql/tests/DecimalArithmeticTest.cpp
+++ b/velox/functions/sparksql/tests/DecimalArithmeticTest.cpp
@@ -517,5 +517,64 @@ TEST_F(DecimalArithmeticTest, divide) {
       {makeConstant<int128_t>(DecimalUtil::kLongDecimalMax, 1, DECIMAL(38, 0)),
        makeConstant<int64_t>(1, 1, DECIMAL(3, 2))});
 }
+
+TEST_F(DecimalArithmeticTest, denyPrecisionLoss) {
+  const std::string denyPrecisionLoss = "_deny_precision_loss";
+  testArithmeticFunction(
+      "add" + denyPrecisionLoss,
+      makeFlatVector(
+          std::vector<int128_t>{21232100, 29998888, 42345678, 42135632},
+          DECIMAL(38, 7)),
+      {makeFlatVector(
+           std::vector<int128_t>{11232100, 9998888, 12345678, 2135632},
+           DECIMAL(38, 7)),
+       makeFlatVector(std::vector<int64_t>{1, 2, 3, 4}, DECIMAL(10, 0))});
+
+  // Overflow when scaling up the whole part.
+  testArithmeticFunction(
+      "add" + denyPrecisionLoss,
+      makeNullableLongDecimalVector(
+          {"null", "null", "null", "null"}, DECIMAL(38, 7)),
+      {makeNullableLongDecimalVector(
+           {"-99999999999999999999999999999999990000",
+            "99999999999999999999999999999999999000",
+            "-99999999999999999999999999999999999900",
+            "99999999999999999999999999999999999990"},
+           DECIMAL(38, 3)),
+       makeFlatVector(
+           std::vector<int128_t>{-100, 9999999, -999900, 99999},
+           DECIMAL(38, 7))});
+
+  testArithmeticFunction(
+      "subtract" + denyPrecisionLoss,
+      makeFlatVector(
+          std::vector<int128_t>{1232100, -10001112, -17654322, -37864368},
+          DECIMAL(38, 7)),
+      {makeFlatVector(
+           std::vector<int128_t>{11232100, 9998888, 12345678, 2135632},
+           DECIMAL(38, 7)),
+       makeFlatVector(std::vector<int64_t>{1, 2, 3, 4}, DECIMAL(10, 0))});
+
+  testArithmeticFunction(
+      "multiply" + denyPrecisionLoss,
+      makeConstant<int128_t>(60501, 1, DECIMAL(38, 10)),
+      {makeConstant<int128_t>(201, 1, DECIMAL(20, 5)),
+       makeConstant<int128_t>(301, 1, DECIMAL(20, 5))});
+
+  // diff > 0
+  testArithmeticFunction(
+      "divide" + denyPrecisionLoss,
+      makeConstant<int128_t>(
+          HugeInt::parse("5" + std::string(18, '0')), 1, DECIMAL(38, 18)),
+      {makeConstant<int128_t>(500, 1, DECIMAL(20, 2)),
+       makeConstant<int64_t>(1000, 1, DECIMAL(17, 3))});
+  // diff < 0
+  testArithmeticFunction(
+      "divide" + denyPrecisionLoss,
+      makeConstant<int128_t>(
+          HugeInt::parse("5" + std::string(10, '0')), 1, DECIMAL(31, 10)),
+      {makeConstant<int128_t>(500, 1, DECIMAL(20, 2)),
+       makeConstant<int64_t>(1000, 1, DECIMAL(7, 3))});
+}
 } // namespace
 } // namespace facebook::velox::functions::sparksql::test
diff --git a/velox/functions/sparksql/tests/DecimalUtilTest.cpp b/velox/functions/sparksql/tests/DecimalUtilTest.cpp
index 833b88605a20..1b63019ed12a 100644
--- a/velox/functions/sparksql/tests/DecimalUtilTest.cpp
+++ b/velox/functions/sparksql/tests/DecimalUtilTest.cpp
@@ -60,4 +60,16 @@ TEST_F(DecimalUtilTest, minLeadingZeros) {
       12);
   ASSERT_EQ(result, 0);
 }
+
+TEST_F(DecimalUtilTest, bounded) {
+  auto testBounded = [](uint8_t rPrecision,
+                        uint8_t rScale,
+                        std::pair<uint8_t, uint8_t> expected) {
+    ASSERT_EQ(DecimalUtil::bounded(rPrecision, rScale), expected);
+  };
+
+  testBounded(10, 3, {10, 3});
+  testBounded(40, 3, {38, 3});
+  testBounded(44, 42, {38, 38});
+}
 } // namespace facebook::velox::functions::sparksql::test