This is an automated email from the ASF dual-hosted git repository.

panxiaolei pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/doris.git


The following commit(s) were added to refs/heads/master by this push:
     new f8a3034dca [Opt](performance) refactor and opt time round floor 
function (#25026)
f8a3034dca is described below

commit f8a3034dca5f45f4cff9c3892fc8386cd514abc6
Author: HappenLee <[email protected]>
AuthorDate: Sun Oct 1 11:51:26 2023 +0800

    [Opt](performance) refactor and opt time round floor function (#25026)
    
    refactor and opt time round floor function
---
 .../vec/functions/function_datetime_floor_ceil.cpp | 252 ++++++++++++---------
 be/src/vec/runtime/vdatetime_value.h               |   2 +-
 2 files changed, 151 insertions(+), 103 deletions(-)

diff --git a/be/src/vec/functions/function_datetime_floor_ceil.cpp 
b/be/src/vec/functions/function_datetime_floor_ceil.cpp
index 967a39c2a3..b66cd5c0b6 100644
--- a/be/src/vec/functions/function_datetime_floor_ceil.cpp
+++ b/be/src/vec/functions/function_datetime_floor_ceil.cpp
@@ -517,13 +517,84 @@ struct FloorCeilImpl {
     }
 };
 
+#define FLOOR 0
+#define CEIL 1
+
+template <typename Impl, typename DateValueType>
+struct TimeRoundOpt {
+    constexpr static bool can_use_optimize(int period) {
+        if constexpr (!std::is_same_v<DateValueType, VecDateTimeValue> && 
Impl::Type == FLOOR) {
+            if constexpr (Impl::Unit == YEAR || Impl::Unit == MONTH || 
Impl::Unit == DAY ||
+                          Impl::Unit == MINUTE || Impl::Unit == SECOND) {
+                return period == 1;
+            }
+            if constexpr (Impl::Unit == HOUR) {
+                return period <= 23 && 24 % period == 0;
+            }
+        }
+        return false;
+    }
+
+    static void floor_opt(const DateValueType& ts2, DateValueType& ts1, int 
period) {
+        if (period == 1) {
+            floor_opt_one_period(ts2, ts1);
+        } else {
+            static constexpr uint64_t MASK_HOUR_FLOOR =
+                    
0b1111111111111111111111111111111100000000000000000000000000000000;
+
+            // Optimize the performance of the datetimev2 type on the floor 
operation.
+            // Now supports unit hour
+            if constexpr (Impl::Unit == HOUR && !std::is_same_v<DateValueType, 
VecDateTimeValue>) {
+                int hour = ts2.hour();
+                int new_hour = hour / period * period;
+                if (new_hour >= 24) {
+                    new_hour = new_hour % 24;
+                }
+                ts1.set_int_val(ts2.to_date_int_val() & MASK_HOUR_FLOOR);
+                ts1.template set_time_unit<TimeUnit::HOUR>(new_hour);
+            }
+        }
+    }
+
+    static void floor_opt_one_period(const DateValueType& ts2, DateValueType& 
ts1) {
+        if constexpr (Impl::Unit == YEAR) {
+            ts1.set_time(ts2.year(), 1, 1, 0, 0, 0);
+        }
+        if constexpr (Impl::Unit == MONTH) {
+            ts1.set_time(ts2.year(), ts2.month(), 1, 0, 0, 0);
+        }
+        if constexpr (Impl::Unit == DAY) {
+            ts1.set_time(ts2.year(), ts2.month(), ts2.day(), 0, 0, 0);
+        }
+
+        if constexpr (std::is_same_v<DateValueType, 
DateV2Value<DateTimeV2ValueType>>) {
+            static constexpr uint64_t MASK_HOUR_FLOOR =
+                    
0b1111111111111111111111111111111100000000000000000000000000000000;
+            static constexpr uint64_t MASK_MINUTE_FLOOR =
+                    
0b1111111111111111111111111111111111111100000000000000000000000000;
+            static constexpr uint64_t MASK_SECOND_FLOOR =
+                    
0b1111111111111111111111111111111111111111111100000000000000000000;
+
+            // Optimize the performance of the datetimev2 type on the floor 
operation.
+            // Now supports unit biger than SECOND
+            if constexpr (Impl::Unit == HOUR) {
+                ts1.set_int_val(ts2.to_date_int_val() & MASK_HOUR_FLOOR);
+            }
+            if constexpr (Impl::Unit == MINUTE) {
+                ts1.set_int_val(ts2.to_date_int_val() & MASK_MINUTE_FLOOR);
+            }
+            if constexpr (Impl::Unit == SECOND) {
+                ts1.set_int_val(ts2.to_date_int_val() & MASK_SECOND_FLOOR);
+            }
+        }
+    }
+};
+
 template <typename Impl>
 struct TimeRound {
     static constexpr auto name = Impl::name;
     static constexpr uint64_t FIRST_DAY = 19700101000000;
     static constexpr uint64_t FIRST_SUNDAY = 19700104000000;
-    static constexpr int8_t FLOOR = 0;
-    static constexpr int8_t CEIL = 1;
 
     static constexpr uint32_t MASK_YEAR_FOR_DATEV2 = ((uint32_t)-1) >> 23;
     static constexpr uint32_t MASK_YEAR_MONTH_FOR_DATEV2 = ((uint32_t)-1) >> 
27;
@@ -534,7 +605,7 @@ struct TimeRound {
     static constexpr uint64_t MASK_YEAR_MONTH_DAY_HOUR_FOR_DATETIMEV2 = 
((uint64_t)-1) >> 32;
     static constexpr uint64_t MASK_YEAR_MONTH_DAY_HOUR_MINUTE_FOR_DATETIMEV2 = 
((uint64_t)-1) >> 38;
 
-    template <typename NativeType, typename DateValueType>
+    template <typename DateValueType>
     static void time_round(const DateValueType& ts2, const Int32 period, 
DateValueType& ts1) {
         int64_t diff;
         int64_t trivial_part_ts1;
@@ -682,89 +753,61 @@ struct TimeRound {
         ts1.template date_add_interval<Impl::Unit, false>(interval);
     }
 
-    template <typename NativeType, typename DateValueType, Int32 period>
+    template <typename DateValueType, Int32 period>
     static void time_round_with_constant_optimization(const DateValueType& ts2,
                                                       DateValueType& ts1) {
-        time_round<NativeType, DateValueType>(ts2, period, ts1);
+        time_round<DateValueType>(ts2, period, ts1);
     }
 
-    static constexpr uint64_t MASK_DAY_FLOOR =
-            0b1111111111111111111111111110000000000000000000000000000000000000;
-    static constexpr uint64_t MASK_HOUR_FLOOR =
-            0b1111111111111111111111111111111100000000000000000000000000000000;
-    static constexpr uint64_t MASK_MINUTE_FLOOR =
-            0b1111111111111111111111111111111111111100000000000000000000000000;
-    static constexpr uint64_t MASK_SECOND_FLOOR =
-            0b1111111111111111111111111111111111111111111100000000000000000000;
-
-    static constexpr bool USE_OPTIMIZE_FLOOR =
-            Impl::Unit == DAY || Impl::Unit == HOUR || Impl::Unit == MINUTE || 
Impl::Unit == SECOND;
-    template <typename NativeType, typename DateValueType>
-    static void datetimev2_floor(const DateValueType& ts2, DateValueType& ts1) 
{
-        // Optimize the performance of the datetimev2 type on the floor 
operation.
-        // Now supports days, hours, minutes, and seconds.
-        if constexpr (Impl::Unit == DAY) {
-            ts1.set_int_val(ts2.to_date_int_val() & MASK_DAY_FLOOR);
-        }
-        if constexpr (Impl::Unit == HOUR) {
-            ts1.set_int_val(ts2.to_date_int_val() & MASK_HOUR_FLOOR);
-        }
-        if constexpr (Impl::Unit == MINUTE) {
-            ts1.set_int_val(ts2.to_date_int_val() & MASK_MINUTE_FLOOR);
-        }
-        if constexpr (Impl::Unit == SECOND) {
-            ts1.set_int_val(ts2.to_date_int_val() & MASK_SECOND_FLOOR);
-        }
-    }
-    template <typename NativeType, typename DateValueType>
+    template <typename DateValueType>
     static void time_round(const DateValueType& ts2, DateValueType& ts1) {
         static_assert(Impl::Unit != WEEK);
-        if constexpr (std::is_same_v<DateValueType, 
DateV2Value<DateTimeV2ValueType>> &&
-                      Impl::Type == FLOOR && USE_OPTIMIZE_FLOOR) {
-            datetimev2_floor<NativeType, DateValueType>(ts2, ts1);
-            return;
-        };
-        if constexpr (std::is_same_v<DateValueType, VecDateTimeValue>) {
-            ts1.reset_zero_by_type(ts2.type());
-        }
-        int64_t diff;
-        int64_t part;
-        if constexpr (Impl::Unit == YEAR) {
-            diff = ts2.year();
-            part = (ts2.month() - 1) + (ts2.day() - 1) + ts2.hour() + 
ts2.minute() + ts2.second();
-        }
-        if constexpr (Impl::Unit == MONTH) {
-            diff = ts2.year() * 12 + ts2.month() - 1;
-            part = (ts2.day() - 1) + ts2.hour() + ts2.minute() + ts2.second();
-        }
-        if constexpr (Impl::Unit == DAY) {
-            diff = ts2.daynr();
-            part = ts2.hour() + ts2.minute() + ts2.second();
-        }
-        if constexpr (Impl::Unit == HOUR) {
-            diff = ts2.daynr() * 24 + ts2.hour();
-            part = ts2.minute() + ts2.second();
-        }
-        if constexpr (Impl::Unit == MINUTE) {
-            diff = ts2.daynr() * 24L * 60 + ts2.hour() * 60 + ts2.minute();
-            part = ts2.second();
-        }
-        if constexpr (Impl::Unit == SECOND) {
-            diff = ts2.daynr() * 24L * 60 * 60 + ts2.hour() * 60L * 60 + 
ts2.minute() * 60L +
-                   ts2.second();
-            part = 0;
-            if constexpr (std::is_same_v<DateValueType, 
DateV2Value<DateTimeV2ValueType>>) {
-                part = ts2.microsecond();
+        if constexpr (TimeRoundOpt<Impl, DateValueType>::can_use_optimize(1)) {
+            TimeRoundOpt<Impl, DateValueType>::floor_opt_one_period(ts2, ts1);
+        } else {
+            if constexpr (std::is_same_v<DateValueType, VecDateTimeValue>) {
+                ts1.reset_zero_by_type(ts2.type());
+            }
+            int64_t diff;
+            int64_t part;
+            if constexpr (Impl::Unit == YEAR) {
+                diff = ts2.year();
+                part = (ts2.month() - 1) + (ts2.day() - 1) + ts2.hour() + 
ts2.minute() +
+                       ts2.second();
+            }
+            if constexpr (Impl::Unit == MONTH) {
+                diff = ts2.year() * 12 + ts2.month() - 1;
+                part = (ts2.day() - 1) + ts2.hour() + ts2.minute() + 
ts2.second();
+            }
+            if constexpr (Impl::Unit == DAY) {
+                diff = ts2.daynr();
+                part = ts2.hour() + ts2.minute() + ts2.second();
+            }
+            if constexpr (Impl::Unit == HOUR) {
+                diff = ts2.daynr() * 24 + ts2.hour();
+                part = ts2.minute() + ts2.second();
+            }
+            if constexpr (Impl::Unit == MINUTE) {
+                diff = ts2.daynr() * 24L * 60 + ts2.hour() * 60 + ts2.minute();
+                part = ts2.second();
+            }
+            if constexpr (Impl::Unit == SECOND) {
+                diff = ts2.daynr() * 24L * 60 * 60 + ts2.hour() * 60L * 60 + 
ts2.minute() * 60L +
+                       ts2.second();
+                part = 0;
+                if constexpr (std::is_same_v<DateValueType, 
DateV2Value<DateTimeV2ValueType>>) {
+                    part = ts2.microsecond();
+                }
             }
-        }
 
-        if constexpr (Impl::Type == CEIL) {
-            if (part) {
-                diff++;
+            if constexpr (Impl::Type == CEIL) {
+                if (part) {
+                    diff++;
+                }
             }
+            TimeInterval interval(Impl::Unit, diff, 1);
+            ts1.template date_set_interval<Impl::Unit>(interval);
         }
-        TimeInterval interval(Impl::Unit, diff, 1);
-        ts1.template date_set_interval<Impl::Unit>(interval);
     }
 
     template <typename NativeType, typename DateValueType>
@@ -772,7 +815,7 @@ struct TimeRound {
         res = origin_date;
         auto ts2 = binary_cast<NativeType, DateValueType>(date);
         auto& ts1 = (DateValueType&)(res);
-        TimeRound<Impl>::template time_round<NativeType, DateValueType>(ts2, 
period, ts1);
+        TimeRound<Impl>::template time_round<DateValueType>(ts2, period, ts1);
     }
 
     template <typename NativeType, typename DateValueType, Int32 period>
@@ -781,22 +824,27 @@ struct TimeRound {
         res = origin_date;
         auto ts2 = binary_cast<NativeType, DateValueType>(date);
         auto& ts1 = (DateValueType&)(res);
-        TimeRound<Impl>::template 
time_round_with_constant_optimization<NativeType, DateValueType,
-                                                                        
period>(ts2, ts1);
+        TimeRound<Impl>::template 
time_round_with_constant_optimization<DateValueType, period>(ts2,
+                                                                               
                ts1);
     }
 
     template <typename NativeType, typename DateValueType>
     static void time_round(NativeType date, Int32 period, NativeType& res) {
         auto ts2 = binary_cast<NativeType, DateValueType>(date);
         auto& ts1 = (DateValueType&)(res);
-        if constexpr (Impl::Unit != WEEK) {
-            ts1.from_olap_datetime(FIRST_DAY);
+
+        if (TimeRoundOpt<Impl, DateValueType>::can_use_optimize(period)) {
+            TimeRoundOpt<Impl, DateValueType>::floor_opt(ts2, ts1, period);
         } else {
-            // Only week use the FIRST SUNDAY
-            ts1.from_olap_datetime(FIRST_SUNDAY);
-        }
+            if constexpr (Impl::Unit != WEEK) {
+                ts1.from_olap_datetime(FIRST_DAY);
+            } else {
+                // Only week use the FIRST SUNDAY
+                ts1.from_olap_datetime(FIRST_SUNDAY);
+            }
 
-        TimeRound<Impl>::template time_round<NativeType, DateValueType>(ts2, 
period, ts1);
+            TimeRound<Impl>::template time_round<DateValueType>(ts2, period, 
ts1);
+        }
     }
 
     template <typename NativeType, typename DateValueType>
@@ -804,11 +852,11 @@ struct TimeRound {
         auto ts2 = binary_cast<NativeType, DateValueType>(date);
         auto& ts1 = (DateValueType&)(res);
         if constexpr (Impl::Unit != WEEK) {
-            TimeRound<Impl>::template time_round<NativeType, 
DateValueType>(ts2, ts1);
+            TimeRound<Impl>::template time_round<DateValueType>(ts2, ts1);
         } else {
             // Only week use the FIRST SUNDAY
             ts1.from_olap_datetime(FIRST_SUNDAY);
-            TimeRound<Impl>::template time_round<NativeType, 
DateValueType>(ts2, 1, ts1);
+            TimeRound<Impl>::template time_round<DateValueType>(ts2, 1, ts1);
         }
     }
 };
@@ -861,21 +909,21 @@ struct TimeRound {
             FunctionDateTimeFloorCeil<FloorCeilImpl<TimeRound<CLASS>>, 
VecDateTimeValue, Int32, 2, \
                                       true>;
 
-TIME_ROUND(YearFloor, year_floor, YEAR, false);
-TIME_ROUND(MonthFloor, month_floor, MONTH, false);
-TIME_ROUND(WeekFloor, week_floor, WEEK, false);
-TIME_ROUND(DayFloor, day_floor, DAY, false);
-TIME_ROUND(HourFloor, hour_floor, HOUR, false);
-TIME_ROUND(MinuteFloor, minute_floor, MINUTE, false);
-TIME_ROUND(SecondFloor, second_floor, SECOND, false);
-
-TIME_ROUND(YearCeil, year_ceil, YEAR, true);
-TIME_ROUND(MonthCeil, month_ceil, MONTH, true);
-TIME_ROUND(WeekCeil, week_ceil, WEEK, true);
-TIME_ROUND(DayCeil, day_ceil, DAY, true);
-TIME_ROUND(HourCeil, hour_ceil, HOUR, true);
-TIME_ROUND(MinuteCeil, minute_ceil, MINUTE, true);
-TIME_ROUND(SecondCeil, second_ceil, SECOND, true);
+TIME_ROUND(YearFloor, year_floor, YEAR, FLOOR);
+TIME_ROUND(MonthFloor, month_floor, MONTH, FLOOR);
+TIME_ROUND(WeekFloor, week_floor, WEEK, FLOOR);
+TIME_ROUND(DayFloor, day_floor, DAY, FLOOR);
+TIME_ROUND(HourFloor, hour_floor, HOUR, FLOOR);
+TIME_ROUND(MinuteFloor, minute_floor, MINUTE, FLOOR);
+TIME_ROUND(SecondFloor, second_floor, SECOND, FLOOR);
+
+TIME_ROUND(YearCeil, year_ceil, YEAR, CEIL);
+TIME_ROUND(MonthCeil, month_ceil, MONTH, CEIL);
+TIME_ROUND(WeekCeil, week_ceil, WEEK, CEIL);
+TIME_ROUND(DayCeil, day_ceil, DAY, CEIL);
+TIME_ROUND(HourCeil, hour_ceil, HOUR, CEIL);
+TIME_ROUND(MinuteCeil, minute_ceil, MINUTE, CEIL);
+TIME_ROUND(SecondCeil, second_ceil, SECOND, CEIL);
 
 void register_function_datetime_floor_ceil(SimpleFunctionFactory& factory) {
 #define REGISTER_FUNC_WITH_DELTA_TYPE(CLASS, DELTA)                        \
diff --git a/be/src/vec/runtime/vdatetime_value.h 
b/be/src/vec/runtime/vdatetime_value.h
index c525e68ee7..3367c2f706 100644
--- a/be/src/vec/runtime/vdatetime_value.h
+++ b/be/src/vec/runtime/vdatetime_value.h
@@ -763,7 +763,7 @@ public:
     }
 
     void set_time(uint16_t year, uint8_t month, uint8_t day, uint8_t hour, 
uint8_t minute,
-                  uint8_t second, uint32_t microsecond);
+                  uint8_t second, uint32_t microsecond = 0);
 
     void set_time(uint8_t hour, uint8_t minute, uint8_t second, uint32_t 
microsecond);
 


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to