This is an automated email from the ASF dual-hosted git repository.
alamb pushed a change to branch dependabot/cargo/main/strum-0.26.1
in repository https://gitbox.apache.org/repos/asf/arrow-datafusion.git
from dbb3e0b1b1 Update strum-macros and datafusion-cli
add 1097dc0345 Fix the clippy error of use of deprecated method (#9034)
add fffc8bef30 feat: support the ergonomics of getting list slice with
stride (#8946)
add a57e270088 Cache common referred expression at the window input (#9009)
add af0e8a95ca Optimize `COUNT( DISTINCT ...)` for strings (up to 9x
faster) (#8849)
add 9bf0f68b36 feat: Parallel Arrow file format reading (#8897)
add 92104a5446 Change remove from swap to shift in index map (#9049)
add d594e6257b Relax join keys constraint from Column to any physical
expression for physical join operators (#8991)
add d2625c35d1 Minor: Improve memory helper trait documentaiton (#9025)
add 90a821a061 Docs: improve contributor guide to explain how to work with
tickets (#8999)
add 8326f577bc upper and lower functions only work correctly on ascii
character #9053 (#9054)
add 724a8e8d5b spelling etc (#9035)
add 851bc7de85 explicitly list out all Expr types (#9038)
add 3eb7080671 Minor: improve scalar functions document (#9029)
add 488cfe117c Minor: alter a test to support new functionality (#9065)
add ee9736fc81 Remove some recursive clones (#9050)
add cea211d218 minor: remove useless macro (#8979)
add 8dee7bbb66 Causality Analysis for Builtin Window Functions (#9048)
add c3f6c0f079 Minor: add doc examples for RawTableAllocExt (#9059)
add 228c88f565 Update substrait requirement from 0.23.0 to 0.24.0 (#9067)
add 4d389c2590 Remove single_file_output option from FileSinkConfig and
Copy statement (#9041)
add 78447d6081 Add a make_date function (#9040)
add d6f7c1623e Speedup `DFSchema::merge` using HashSet indices (#9020)
add 7fb83cc318 Document minimum required rust version (#9071)
add efd2fd2e26 Return proper number of expressions for nth_value_agg
(#9044)
add 85ceb9db7a ScalarUDF with zero arguments should be provided with one
null array as parameter (#9031)
add 7c5ac55df6 Merge remote-tracking branch 'apache/main' into
dependabot/cargo/main/strum-0.26.1
No new revisions were added by this update.
Summary of changes:
CONTRIBUTING.md | 2 +-
Cargo.toml | 2 +-
README.md | 6 +-
benchmarks/bench.sh | 17 +-
benchmarks/queries/clickbench/README.md | 3 +-
datafusion-cli/Cargo.lock | 1 +
datafusion-examples/README.md | 1 +
datafusion-examples/examples/make_date.rs | 120 +++++
datafusion/common/src/dfschema.rs | 16 +-
datafusion/core/src/dataframe/mod.rs | 2 -
datafusion/core/src/dataframe/parquet.rs | 1 -
.../core/src/datasource/file_format/arrow.rs | 1 -
.../core/src/datasource/file_format/parquet.rs | 1 -
.../core/src/datasource/file_format/write/demux.rs | 2 +-
.../datasource/file_format/write/orchestration.rs | 2 -
datafusion/core/src/datasource/listing/table.rs | 1 -
.../src/datasource/physical_plan/arrow_file.rs | 159 ++++++-
.../core/src/datasource/physical_plan/csv.rs | 4 +-
.../core/src/datasource/physical_plan/json.rs | 4 +-
.../core/src/datasource/physical_plan/mod.rs | 4 -
.../src/datasource/physical_plan/parquet/mod.rs | 4 +-
.../src/physical_optimizer/enforce_distribution.rs | 291 +++++++-----
.../core/src/physical_optimizer/enforce_sorting.rs | 19 +-
.../core/src/physical_optimizer/join_selection.rs | 79 ++--
.../src/physical_optimizer/projection_pushdown.rs | 53 ++-
.../replace_with_order_preserving_variants.rs | 2 +-
datafusion/core/src/physical_planner.rs | 29 +-
.../tests/fuzz_cases/distinct_count_string_fuzz.rs | 211 +++++++++
datafusion/core/tests/fuzz_cases/join_fuzz.rs | 8 +-
datafusion/core/tests/fuzz_cases/mod.rs | 1 +
datafusion/core/tests/fuzz_cases/window_fuzz.rs | 205 ++++++---
.../user_defined/user_defined_scalar_functions.rs | 114 ++++-
datafusion/execution/src/memory_pool/mod.rs | 15 +-
datafusion/execution/src/memory_pool/proxy.rs | 40 +-
datafusion/expr/src/built_in_function.rs | 10 +
datafusion/expr/src/expr.rs | 28 +-
datafusion/expr/src/expr_fn.rs | 3 +-
datafusion/expr/src/expr_schema.rs | 7 +-
datafusion/expr/src/field_util.rs | 13 +-
datafusion/expr/src/logical_plan/builder.rs | 4 +-
datafusion/expr/src/logical_plan/dml.rs | 4 -
datafusion/expr/src/logical_plan/plan.rs | 80 ++--
datafusion/expr/src/partition_evaluator.rs | 5 +
datafusion/expr/src/tree_node/expr.rs | 4 +-
datafusion/expr/src/tree_node/plan.rs | 6 +-
datafusion/expr/src/utils.rs | 2 +-
datafusion/optimizer/src/analyzer/rewrite_expr.rs | 2 +-
datafusion/optimizer/src/analyzer/type_coercion.rs | 23 +-
.../optimizer/src/common_subexpr_eliminate.rs | 79 +++-
datafusion/optimizer/src/eliminate_outer_join.rs | 5 +-
datafusion/optimizer/src/optimize_projections.rs | 6 +-
datafusion/optimizer/src/optimizer.rs | 5 +-
datafusion/optimizer/src/push_down_filter.rs | 117 ++---
datafusion/optimizer/src/push_down_limit.rs | 106 +++--
.../src/simplify_expressions/simplify_exprs.rs | 2 +-
.../optimizer/src/unwrap_cast_in_comparison.rs | 4 +-
datafusion/optimizer/src/utils.rs | 3 +-
datafusion/physical-expr/Cargo.toml | 1 +
.../{count_distinct.rs => count_distinct/mod.rs} | 126 +++---
.../src/aggregate/count_distinct/strings.rs | 490 +++++++++++++++++++++
.../physical-expr/src/aggregate/nth_value.rs | 9 +-
.../physical-expr/src/datetime_expressions.rs | 221 +++++++++-
datafusion/physical-expr/src/equivalence/class.rs | 26 +-
.../physical-expr/src/equivalence/properties.rs | 45 +-
.../src/expressions/get_indexed_field.rs | 85 +++-
datafusion/physical-expr/src/functions.rs | 2 +
datafusion/physical-expr/src/planner.rs | 45 +-
datafusion/physical-expr/src/scalar_function.rs | 17 +-
datafusion/physical-expr/src/string_expressions.rs | 4 +-
datafusion/physical-expr/src/udf.rs | 1 +
datafusion/physical-expr/src/window/built_in.rs | 7 +-
datafusion/physical-expr/src/window/lead_lag.rs | 5 +
datafusion/physical-expr/src/window/rank.rs | 4 +
datafusion/physical-expr/src/window/row_number.rs | 5 +
datafusion/physical-plan/src/joins/hash_join.rs | 197 ++++-----
.../physical-plan/src/joins/sort_merge_join.rs | 152 +++----
.../physical-plan/src/joins/symmetric_hash_join.rs | 84 ++--
datafusion/physical-plan/src/joins/test_utils.rs | 12 +-
datafusion/physical-plan/src/joins/utils.rs | 177 +++++---
datafusion/proto/proto/datafusion.proto | 9 +-
datafusion/proto/src/generated/pbjson.rs | 73 +--
datafusion/proto/src/generated/prost.rs | 15 +-
datafusion/proto/src/logical_plan/from_proto.rs | 16 +
datafusion/proto/src/logical_plan/mod.rs | 3 -
datafusion/proto/src/logical_plan/to_proto.rs | 20 +-
datafusion/proto/src/physical_plan/from_proto.rs | 29 +-
datafusion/proto/src/physical_plan/mod.rs | 73 +--
datafusion/proto/src/physical_plan/to_proto.rs | 16 +-
.../proto/tests/cases/roundtrip_logical_plan.rs | 7 -
.../proto/tests/cases/roundtrip_physical_plan.rs | 40 +-
datafusion/sql/src/expr/mod.rs | 53 ++-
datafusion/sql/src/statement.rs | 6 -
datafusion/sql/tests/sql_integration.rs | 6 +-
datafusion/sqllogictest/Cargo.toml | 1 +
datafusion/sqllogictest/test_files/aggregate.slt | 57 +++
datafusion/sqllogictest/test_files/array.slt | 45 ++
datafusion/sqllogictest/test_files/clickbench.slt | 3 +
datafusion/sqllogictest/test_files/copy.slt | 34 +-
datafusion/sqllogictest/test_files/csv_files.slt | 4 +-
datafusion/sqllogictest/test_files/functions.slt | 22 +-
datafusion/sqllogictest/test_files/group_by.slt | 8 +-
datafusion/sqllogictest/test_files/parquet.slt | 8 +-
datafusion/sqllogictest/test_files/repartition.slt | 2 +-
.../sqllogictest/test_files/repartition_scan.slt | 19 +-
.../sqllogictest/test_files/schema_evolution.slt | 8 +-
datafusion/sqllogictest/test_files/timestamps.slt | 164 +++++++
datafusion/sqllogictest/test_files/window.slt | 259 ++++++-----
datafusion/substrait/Cargo.toml | 2 +-
docs/source/contributor-guide/index.md | 39 +-
docs/source/user-guide/sql/dml.md | 2 +-
docs/source/user-guide/sql/scalar_functions.md | 102 ++++-
docs/source/user-guide/sql/write_options.md | 12 +-
112 files changed, 3527 insertions(+), 1283 deletions(-)
create mode 100644 datafusion-examples/examples/make_date.rs
create mode 100644 datafusion/core/tests/fuzz_cases/distinct_count_string_fuzz.rs
rename datafusion/physical-expr/src/aggregate/{count_distinct.rs => count_distinct/mod.rs} (90%)
create mode 100644 datafusion/physical-expr/src/aggregate/count_distinct/strings.rs