Re: [PR] [Variant] `rescale_decimal` followup [arrow-rs]

via GitHub Mon, 20 Oct 2025 12:14:30 -0700


scovich commented on code in PR #8655:
URL: https://github.com/apache/arrow-rs/pull/8655#discussion_r2445879368



##########
parquet-variant-compute/src/type_conversion.rs:
##########
@@ -239,44 +247,22 @@ where
             false if r <= half_neg => d.sub_wrapping(I::Native::ONE),
             _ => d,
         };
-        O::Native::from_decimal(adjusted)
-    };
 
-    scaled.filter(|v| is_infallible_cast || O::is_valid_decimal_precision(*v, 
output_precision))
-}
-
-/// Returns true if casting from (input_precision, input_scale) to
-/// (output_precision, output_scale) is infallible based on precision/scale 
math.
-fn is_infallible_decimal_cast(
-    input_precision: u8,
-    input_scale: i8,
-    output_precision: u8,
-    output_scale: i8,
-) -> bool {
-    let delta_scale = output_scale - input_scale;
-    let input_precision = input_precision as i8;
-    let output_precision = output_precision as i8;
-    if delta_scale >= 0 {
-        // if the gain in precision (digits) is greater than the 
multiplication due to scaling
-        // every number will fit into the output type
-        // Example: If we are starting with any number of precision 5 [xxxxx],
-        // then an increase of scale by 3 will have the following effect on 
the representation:
-        // [xxxxx] -> [xxxxx000], so for the cast to be infallible, the output 
type
-        // needs to provide at least 8 digits precision
-        input_precision + delta_scale <= output_precision
-    } else {
         // if the reduction of the input number through scaling (dividing) is 
greater
         // than a possible precision loss (plus potential increase via 
rounding)
         // every input number will fit into the output type
         // Example: If we are starting with any number of precision 5 [xxxxx],
         // then and decrease the scale by 3 will have the following effect on 
the representation:
         // [xxxxx] -> [xx] (+ 1 possibly, due to rounding).
-        // The rounding may add an additional digit, so for the cast to be 
infallible,
+        // The rounding may add a digit, so for the cast to be infallible,
         // the output type needs to have at least 3 digits of precision.
         // e.g. Decimal(5, 3) 99.999 to Decimal(3, 0) will result in 100:
         // [99999] -> [99] + 1 = [100], a cast to Decimal(2, 0) would not be 
possible
-        input_precision + delta_scale < output_precision
-    }
+        let is_infallible_cast = input_precision as i8 + delta_scale < 
output_precision as i8;
+        (O::Native::from_decimal(adjusted), is_infallible_cast)
+    };
+
+    scaled.filter(|v| is_infallible_cast || O::is_valid_decimal_precision(*v, 
output_precision))

Review Comment:
   Aside: I _believe_ compiler "jump threading" optimizations should bypass the 
`filter` call when `is_infallible_cast=true`. I'm not sure how to verify that, though.
   
   Alternatively, we can drastically increase the probability of successful 
jump threading by declaring `scaled` as `mut` and then:
   
   ```suggestion
       if !is_infallible_cast {
           scaled = scaled.filter(|v| O::is_valid_decimal_precision(*v, 
output_precision));
       }
       scaled
   ```
   (if we pursue that, we may want to change the logic to `is_fallible_cast` to 
avoid error-prone double negative logic)



##########
parquet-variant-compute/src/type_conversion.rs:
##########
@@ -189,40 +189,48 @@ where
 /// Rescale a decimal from (input_precision, input_scale) to 
(output_precision, output_scale)
 /// and return the scaled value if it fits the output precision. Similar to 
the implementation in
 /// decimal.rs in arrow-cast.
-pub(crate) fn rescale_decimal<I, O>(
+pub(crate) fn rescale_decimal<I: DecimalType, O: DecimalType>(
     value: I::Native,
     input_precision: u8,
     input_scale: i8,
     output_precision: u8,
     output_scale: i8,
 ) -> Option<O::Native>
 where
-    I: DecimalType,
-    O: DecimalType,
     I::Native: DecimalCast,
     O::Native: DecimalCast,
 {
     let delta_scale = output_scale - input_scale;
 
-    // Determine if the cast is infallible based on precision/scale math
-    let is_infallible_cast =
-        is_infallible_decimal_cast(input_precision, input_scale, 
output_precision, output_scale);
+    let (scaled, is_infallible_cast) = if delta_scale >= 0 {
+        // O::MAX_FOR_EACH_PRECISION[k] stores 10^k - 1 (e.g., 9, 99, 999, 
...).
+        // Adding 1 yields exactly 10^k without computing a power at runtime.
+        // Using the precomputed table avoids pow(10, k) and its 
checked/overflow
+        // handling, which is faster and simpler for scaling by 10^delta_scale.
+        let max = O::MAX_FOR_EACH_PRECISION.get(delta_scale as usize)?;
+        let mul = max.add_wrapping(O::Native::ONE);
 
-    let scaled = if delta_scale == 0 {
-        O::Native::from_decimal(value)
-    } else if delta_scale > 0 {
-        let mul = O::Native::from_decimal(10_i128)
-            .and_then(|t| t.pow_checked(delta_scale as u32).ok())?;
-        O::Native::from_decimal(value).and_then(|x| x.mul_checked(mul).ok())
+        // if the gain in precision (digits) is greater than the 
multiplication due to scaling
+        // every number will fit into the output type
+        // Example: If we are starting with any number of precision 5 [xxxxx],
+        // then an increase of scale by 3 will have the following effect on 
the representation:
+        // [xxxxx] -> [xxxxx000], so for the cast to be infallible, the output 
type
+        // needs to provide at least 8 digits precision
+        let is_infallible_cast = input_precision as i8 + delta_scale <= 
output_precision as i8;
+        let scaled = if is_infallible_cast {
+            Some(O::Native::from_decimal(value).unwrap().mul_wrapping(mul))
+        } else {
+            O::Native::from_decimal(value).and_then(|x| 
x.mul_checked(mul).ok())
+        };

Review Comment:
   ```suggestion
           let value = O::Native::from_decimal(value);
           let scaled = if is_infallible_cast {
               Some(value.unwrap().mul_wrapping(mul))
           } else {
               value.and_then(|x| x.mul_checked(mul).ok())
           };
   ```



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]

Re: [PR] [Variant] `rescale_decimal` followup [arrow-rs]

Reply via email to