[arrow-rs] branch master updated: fix: cast decimal to decimal should be round the result (#3139)

tustvold Thu, 24 Nov 2022 23:06:24 -0800

This is an automated email from the ASF dual-hosted git repository.

tustvold pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/arrow-rs.git



The following commit(s) were added to refs/heads/master by this push:
     new 187bf619d fix: cast decimal to decimal should be round the result (#3139)
187bf619d is described below

commit 187bf619dfafccdb21cea6b2cecabd29daffc1e4
Author: Kun Liu <[email protected]>
AuthorDate: Fri Nov 25 15:06:12 2022 +0800

    fix: cast decimal to decimal should be round the result (#3139)
    
    Co-authored-by: Raphael Taylor-Davies <[email protected]>
---
 arrow-cast/src/cast.rs | 192 +++++++++++++++++++++++++++++++++++++++++++++----
 1 file changed, 179 insertions(+), 13 deletions(-)

diff --git a/arrow-cast/src/cast.rs b/arrow-cast/src/cast.rs
index 3f1775825..07c7d6a3a 100644
--- a/arrow-cast/src/cast.rs
+++ b/arrow-cast/src/cast.rs
@@ -1967,12 +1967,26 @@ fn cast_decimal_to_decimal_safe<const BYTE_WIDTH1: usize, const BYTE_WIDTH2: usi
         // For example, input_scale is 4 and output_scale is 3;
         // Original value is 11234_i128, and will be cast to 1123_i128.
         let div = 10_i128.pow((input_scale - output_scale) as u32);
+        let half = div / 2;
+        let neg_half = half.wrapping_neg();
         if BYTE_WIDTH1 == 16 {
             let array = array.as_any().downcast_ref::<Decimal128Array>().unwrap();
             if BYTE_WIDTH2 == 16 {
-                let iter = array
-                    .iter()
-                    .map(|v| v.and_then(|v| v.div_checked(div).ok()));
+                // rounding the result
+                let iter = array.iter().map(|v| {
+                    v.map(|v| {
+                        // the div must be gt_eq 10, we don't need to check the overflow for the `div`/`mod` operation
+                        let d = v.wrapping_div(div);
+                        let r = v.wrapping_rem(div);
+                        if v >= 0 && r >= half {
+                            d.wrapping_add(1)
+                        } else if v < 0 && r <= neg_half {
+                            d.wrapping_sub(1)
+                        } else {
+                            d
+                        }
+                    })
+                });
                 let casted_array = unsafe {
                     PrimitiveArray::<Decimal128Type>::from_trusted_len_iter(iter)
                 };
@@ -1981,7 +1995,17 @@ fn cast_decimal_to_decimal_safe<const BYTE_WIDTH1: usize, const BYTE_WIDTH2: usi
                     .map(|a| Arc::new(a) as ArrayRef)
             } else {
                 let iter = array.iter().map(|v| {
-                    v.and_then(|v| v.div_checked(div).ok().map(i256::from_i128))
+                    v.map(|v| {
+                        let d = v.wrapping_div(div);
+                        let r = v.wrapping_rem(div);
+                        i256::from_i128(if v >= 0 && r >= half {
+                            d.wrapping_add(1)
+                        } else if v < 0 && r <= neg_half {
+                            d.wrapping_sub(1)
+                        } else {
+                            d
+                        })
+                    })
                 });
                 let casted_array = unsafe {
                     PrimitiveArray::<Decimal256Type>::from_trusted_len_iter(iter)
@@ -1993,9 +2017,22 @@ fn cast_decimal_to_decimal_safe<const BYTE_WIDTH1: usize, const BYTE_WIDTH2: usi
         } else {
             let array = array.as_any().downcast_ref::<Decimal256Array>().unwrap();
             let div = i256::from_i128(div);
+            let half = div / i256::from_i128(2);
+            let neg_half = half.wrapping_neg();
             if BYTE_WIDTH2 == 16 {
                 let iter = array.iter().map(|v| {
-                    v.and_then(|v| v.div_checked(div).ok().and_then(|v| v.to_i128()))
+                    v.and_then(|v| {
+                        let d = v.wrapping_div(div);
+                        let r = v.wrapping_rem(div);
+                        if v >= i256::ZERO && r >= half {
+                            d.wrapping_add(i256::ONE)
+                        } else if v < i256::ZERO && r <= neg_half {
+                            d.wrapping_sub(i256::ONE)
+                        } else {
+                            d
+                        }
+                        .to_i128()
+                    })
                 });
                 let casted_array = unsafe {
                     PrimitiveArray::<Decimal128Type>::from_trusted_len_iter(iter)
@@ -2004,9 +2041,19 @@ fn cast_decimal_to_decimal_safe<const BYTE_WIDTH1: usize, const BYTE_WIDTH2: usi
                     .with_precision_and_scale(*output_precision, *output_scale)
                     .map(|a| Arc::new(a) as ArrayRef)
             } else {
-                let iter = array
-                    .iter()
-                    .map(|v| v.and_then(|v| v.div_checked(div).ok()));
+                let iter = array.iter().map(|v| {
+                    v.map(|v| {
+                        let d = v.wrapping_div(div);
+                        let r = v.wrapping_rem(div);
+                        if v >= i256::ZERO && r >= half {
+                            d.wrapping_add(i256::ONE)
+                        } else if v < i256::ZERO && r <= neg_half {
+                            d.wrapping_sub(i256::ONE)
+                        } else {
+                            d
+                        }
+                    })
+                });
                 let casted_array = unsafe {
                     PrimitiveArray::<Decimal256Type>::from_trusted_len_iter(iter)
                 };
@@ -3566,6 +3613,125 @@ mod tests {
             .with_precision_and_scale(precision, scale)
     }
 
+    #[test]
+    #[cfg(not(feature = "force_validate"))]
+    fn test_cast_decimal_to_decimal_round() {
+        let array = vec![
+            Some(1123454),
+            Some(2123456),
+            Some(-3123453),
+            Some(-3123456),
+            None,
+        ];
+        let input_decimal_array = create_decimal_array(array, 20, 4).unwrap();
+        let array = Arc::new(input_decimal_array) as ArrayRef;
+        // decimal128 to decimal128
+        let input_type = DataType::Decimal128(20, 4);
+        let output_type = DataType::Decimal128(20, 3);
+        assert!(can_cast_types(&input_type, &output_type));
+        generate_cast_test_case!(
+            &array,
+            Decimal128Array,
+            &output_type,
+            vec![
+                Some(112345_i128),
+                Some(212346_i128),
+                Some(-312345_i128),
+                Some(-312346_i128),
+                None
+            ]
+        );
+
+        // decimal128 to decimal256
+        let input_type = DataType::Decimal128(20, 4);
+        let output_type = DataType::Decimal256(20, 3);
+        assert!(can_cast_types(&input_type, &output_type));
+        generate_cast_test_case!(
+            &array,
+            Decimal256Array,
+            &output_type,
+            vec![
+                Some(i256::from_i128(112345_i128)),
+                Some(i256::from_i128(212346_i128)),
+                Some(i256::from_i128(-312345_i128)),
+                Some(i256::from_i128(-312346_i128)),
+                None
+            ]
+        );
+
+        // decimal256
+        let array = vec![
+            Some(i256::from_i128(1123454)),
+            Some(i256::from_i128(2123456)),
+            Some(i256::from_i128(-3123453)),
+            Some(i256::from_i128(-3123456)),
+            None,
+        ];
+        let input_decimal_array = create_decimal256_array(array, 20, 4).unwrap();
+        let array = Arc::new(input_decimal_array) as ArrayRef;
+
+        // decimal256 to decimal256
+        let input_type = DataType::Decimal256(20, 4);
+        let output_type = DataType::Decimal256(20, 3);
+        assert!(can_cast_types(&input_type, &output_type));
+        generate_cast_test_case!(
+            &array,
+            Decimal256Array,
+            &output_type,
+            vec![
+                Some(i256::from_i128(112345_i128)),
+                Some(i256::from_i128(212346_i128)),
+                Some(i256::from_i128(-312345_i128)),
+                Some(i256::from_i128(-312346_i128)),
+                None
+            ]
+        );
+        // decimal256 to decimal128
+        let input_type = DataType::Decimal256(20, 4);
+        let output_type = DataType::Decimal128(20, 3);
+        assert!(can_cast_types(&input_type, &output_type));
+        generate_cast_test_case!(
+            &array,
+            Decimal128Array,
+            &output_type,
+            vec![
+                Some(112345_i128),
+                Some(212346_i128),
+                Some(-312345_i128),
+                Some(-312346_i128),
+                None
+            ]
+        );
+
+        // decimal256 to decimal128 overflow
+        let array = vec![
+            Some(i256::from_i128(1123454)),
+            Some(i256::from_i128(2123456)),
+            Some(i256::from_i128(-3123453)),
+            Some(i256::from_i128(-3123456)),
+            None,
+            Some(i256::MAX),
+            Some(i256::MIN),
+        ];
+        let input_decimal_array = create_decimal256_array(array, 76, 4).unwrap();
+        let array = Arc::new(input_decimal_array) as ArrayRef;
+        assert!(can_cast_types(&input_type, &output_type));
+        generate_cast_test_case!(
+            &array,
+            Decimal128Array,
+            &output_type,
+            vec![
+                Some(112345_i128),
+                Some(212346_i128),
+                Some(-312345_i128),
+                Some(-312346_i128),
+                None,
+                None,
+                None
+            ]
+        );
+    }
+
     #[test]
     #[cfg(not(feature = "force_validate"))]
     fn test_cast_decimal128_to_decimal128() {
@@ -7219,7 +7385,7 @@ mod tests {
         let input_type = DataType::Decimal128(20, 0);
         let output_type = DataType::Decimal128(20, -1);
         assert!(can_cast_types(&input_type, &output_type));
-        let array = vec![Some(1123456), Some(2123456), Some(3123456), None];
+        let array = vec![Some(1123450), Some(2123455), Some(3123456), None];
         let input_decimal_array = create_decimal_array(array, 20, 0).unwrap();
         let array = Arc::new(input_decimal_array) as ArrayRef;
         generate_cast_test_case!(
@@ -7228,8 +7394,8 @@ mod tests {
             &output_type,
             vec![
                 Some(112345_i128),
-                Some(212345_i128),
-                Some(312345_i128),
+                Some(212346_i128),
+                Some(312346_i128),
                 None
             ]
         );
@@ -7238,8 +7404,8 @@ mod tests {
         let decimal_arr = as_primitive_array::<Decimal128Type>(&casted_array);
 
         assert_eq!("1123450", decimal_arr.value_as_string(0));
-        assert_eq!("2123450", decimal_arr.value_as_string(1));
-        assert_eq!("3123450", decimal_arr.value_as_string(2));
+        assert_eq!("2123460", decimal_arr.value_as_string(1));
+        assert_eq!("3123460", decimal_arr.value_as_string(2));
     }
 
     #[test]

[arrow-rs] branch master updated: fix: cast decimal to decimal should be round the result (#3139)

Reply via email to