This is an automated email from the ASF dual-hosted git repository.
rui-mo pushed a change to branch ts_ntz_dev
in repository https://gitbox.apache.org/repos/asf/gluten.git
omit 65182e0f12 [GLUTEN-11622][VL] Use formatted string for TIMESTAMP_NTZ
partition value
omit 45e2bacceb [GLUTEN-11622][VL] Add basic TIMESTAMP_NTZ type support
(#11939)
add b40f776e70 [INFRA] Enable automated GitHub Copilot code reviews
(#12228)
add 60ce4f880f [VL] Skip escape argument when offloading `Like`
expressions without backslashes (#12152)
add a2cdb98ea8 [VL] Support native scala udaf in window (#12117)
add 5668e14bcf [GLUTEN-12225][CORE] Fix arrow.c shading: exclude
memory/vector packages so public API stays unshaded (#12226)
add 2731470f62 [GLUTEN-12143][VL] Route bitmap_construct_agg to native
Velox execution (#12142)
add 6565a406b8 [MINOR] Upgrade Spark 4.0 to 4.0.2 (#12180)
add 73ca2130c3 [GLUTEN-6887][VL] Daily Update Velox Version (2026_06_04)
(#12230)
add 9acd3d7015 [GLUTEN-12022][VL] Extend S3 filesystem registration in
Gluten (#12026)
add aa82d4aae6 [VL] Reduce Velox scan SQL metrics by default to mitigate
driver OOM (#12127)
add ca7d68f7a2 [VL] Bump FasterXML Jackson to 2.18.6 for Spark 3.5 and
above (#12243)
add a8bf7ea290 [MINOR] Fix typo in shuffleInputOutput config name (#12239)
add 9de3b50b1f [VL] Fixed iceberg config logic (#12221)
add 4281c08a5f [GLUTEN-6887][VL] Daily Update Velox Version
(dft-2026_06_05) (#12247)
add bc37334384 [GLUTEN-10215][VL] Remove streaming aggregation workaround
in Delta stats writer (#12222)
add fc90a7933a [VL] Respect orc.force.positional.evolution (#12234)
add b96d8e83d6 [MINOR][VL] Re-enable stale ignored atan2 test in
MathFunctionsValidateSuite (#12199)
add 2e37dd2f2e Bump pyarrow in /tools/workload/benchmark_velox/analysis
(#12254)
add 2d6f39bcac [Core] Upgrade default spark version to 4.0.2 (#12252)
add 7415d74c22 [VL] Make Velox memory manager capacity ratio configurable
(#12258)
add 6e04b4a4bb [MINOR][VL] Remove modify_arrow_dataset_scan_option.patch
(#12148)
add 4634c80a21 [GLUTEN-11915][VL] Support RowBasedChecksum in
ColumnarShuffleWriter (SPARK-51756) (#12067)
add 64c75a5ab1 [GLUTEN-11622][VL] Add basic TIMESTAMP_NTZ type support
(#11939)
add df10cf0573 [GLUTEN-11622][VL] Use formatted string for TIMESTAMP_NTZ
partition value
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user force-pushes a change (git push --force), producing a
repository history that looks something like this:
 * -- * -- B -- O -- O -- O   (65182e0f12)
            \
             N -- N -- N   refs/heads/ts_ntz_dev (df10cf0573)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No revisions new to the repository were added by this update.
Summary of changes:
.asf.yaml | 5 +
.github/workflows/util/install-spark-resources.sh | 2 +-
.github/workflows/velox_backend_x86.yml | 4 +-
.../org/apache/gluten/utils/CHExpressionUtil.scala | 1 +
.../VeloxCelebornColumnarShuffleWriter.scala | 3 +-
.../delta/stats/GlutenDeltaJobStatsTracker.scala | 65 +-
.../delta/stats/GlutenDeltaJobStatsTracker.scala | 65 +-
.../execution/AbstractIcebergWriteExec.scala | 2 +-
.../execution/enhanced/VeloxIcebergSuite.scala | 71 ++
.../writer/VeloxUniffleColumnarShuffleWriter.java | 3 +-
.../gluten/backendsapi/velox/VeloxMetricsApi.scala | 18 +
.../backendsapi/velox/VeloxSparkPlanExecApi.scala | 158 +++-
.../org/apache/gluten/config/VeloxConfig.scala | 5 +-
.../gluten/metrics/BatchScanMetricsUpdater.scala | 102 ++-
.../metrics/FileSourceScanMetricsUpdater.scala | 116 +--
.../metrics/HiveTableScanMetricsUpdater.scala | 113 +--
.../spark/shuffle/ColumnarShuffleWriter.scala | 21 +-
.../apache/spark/sql/expression/UDFResolver.scala | 45 +-
.../apache/gluten/expression/VeloxUdfSuite.scala | 146 +++-
.../functions/MathFunctionsValidateSuite.scala | 8 +-
cpp/core/config/GlutenConfig.h | 3 +
cpp/core/jni/JniWrapper.cc | 16 +-
cpp/core/shuffle/Options.h | 2 +
cpp/core/shuffle/ShuffleWriter.cc | 4 +
cpp/core/shuffle/ShuffleWriter.h | 2 +
cpp/core/utils/tac/ffor.hpp | 3 +-
cpp/velox/CMakeLists.txt | 13 +-
cpp/velox/compute/VeloxBackend.cc | 24 +-
cpp/velox/filesystem/GlutenS3FileSystem.cc | 54 ++
.../filesystem/GlutenS3FileSystem.h} | 29 +-
cpp/velox/shuffle/VeloxHashShuffleWriter.cc | 65 ++
cpp/velox/shuffle/VeloxHashShuffleWriter.h | 11 +-
cpp/velox/substrait/SubstraitToVeloxPlan.cc | 3 +-
.../substrait/SubstraitToVeloxPlanValidator.cc | 3 +-
cpp/velox/tests/CMakeLists.txt | 4 +
cpp/velox/tests/GlutenS3FileSystemTest.cc | 57 ++
cpp/velox/tests/RowBasedChecksumTest.cc | 121 +++
cpp/velox/udf/examples/UdfCommon.h | 4 +-
dev/build-arrow.sh | 1 -
dev/check-arrow-c-shading.sh | 89 +++
docs/Configuration.md | 1 +
docs/developers/VeloxUDF.md | 1 +
docs/get-started/build-guide.md | 2 +-
docs/get-started/getting-started.md | 2 +-
docs/velox-configuration.md | 2 +-
ep/build-velox/src/get-velox.sh | 6 +-
.../src/modify_arrow_dataset_scan_option.patch | 883 ---------------------
.../gluten/vectorized/GlutenSplitResult.java | 9 +-
.../gluten/vectorized/ShuffleWriterJniWrapper.java | 3 +-
.../apache/gluten/execution/IcebergWriteExec.scala | 9 +-
.../gluten/backendsapi/SparkPlanExecApi.scala | 137 +---
.../org/apache/gluten/config/GlutenConfig.scala | 41 +
.../execution/FileSourceScanExecTransformer.scala | 13 +-
.../apache/gluten/metrics/ScanMetricsUtil.scala | 81 ++
.../sql/hive/HiveTableScanExecTransformer.scala | 5 +-
.../gluten/metrics/ScanMetricsUtilSuite.scala | 70 ++
.../hive/execution/GlutenHiveSQLQuerySuite.scala | 30 +
.../hive/execution/GlutenHiveSQLQuerySuite.scala | 30 +
.../utils/clickhouse/ClickHouseTestSettings.scala | 2 +
.../gluten/utils/velox/VeloxTestSettings.scala | 4 +
.../sql/GlutenBitmapExpressionsQuerySuite.scala | 21 +-
.../hive/execution/GlutenHiveSQLQuerySuite.scala | 30 +
.../utils/clickhouse/ClickHouseTestSettings.scala | 2 +
.../gluten/utils/velox/VeloxTestSettings.scala | 5 +
.../sql/GlutenBitmapExpressionsQuerySuite.scala | 21 +-
.../GlutenKeyGroupedPartitioningSuite.scala | 56 ++
.../hive/execution/GlutenHiveSQLQuerySuite.scala | 30 +
.../utils/clickhouse/ClickHouseTestSettings.scala | 2 +
.../gluten/utils/velox/VeloxTestSettings.scala | 10 +-
.../sql/GlutenBitmapExpressionsQuerySuite.scala | 21 +-
.../sql/gluten/GlutenRowBasedChecksumSuite.scala | 91 +++
.../hive/execution/GlutenHiveSQLQuerySuite.scala | 30 +
.../gluten/config/GlutenRuntimeConfigSuite.scala | 15 +
package/pom.xml | 43 +-
pom.xml | 8 +-
.../apache/gluten/expression/ExpressionNames.scala | 1 +
.../apache/spark/shuffle/GlutenMapStatusUtil.scala | 15 +-
.../apache/spark/shuffle/GlutenMapStatusUtil.scala | 15 +-
.../gluten/sql/shims/spark35/Spark35Shims.scala | 3 +-
.../apache/spark/shuffle/GlutenMapStatusUtil.scala | 15 +-
.../gluten/sql/shims/spark40/Spark40Shims.scala | 3 +-
.../apache/spark/shuffle/GlutenMapStatusUtil.scala | 15 +-
.../gluten/sql/shims/spark41/Spark41Shims.scala | 3 +-
.../spark/shuffle/GlutenMapStatusUtil.scala} | 27 +-
.../gluten/integration/action/DataGenOnly.scala | 52 +-
tools/gluten-it/pom.xml | 2 +-
.../benchmark_velox/analysis/requirements.txt | 2 +-
87 files changed, 1891 insertions(+), 1439 deletions(-)
create mode 100644 cpp/velox/filesystem/GlutenS3FileSystem.cc
copy cpp/{core/utils/WholeStageDumper.h =>
velox/filesystem/GlutenS3FileSystem.h} (55%)
create mode 100644 cpp/velox/tests/GlutenS3FileSystemTest.cc
create mode 100644 cpp/velox/tests/RowBasedChecksumTest.cc
create mode 100755 dev/check-arrow-c-shading.sh
delete mode 100644 ep/build-velox/src/modify_arrow_dataset_scan_option.patch
create mode 100644
gluten-substrait/src/main/scala/org/apache/gluten/metrics/ScanMetricsUtil.scala
create mode 100644
gluten-substrait/src/test/scala/org/apache/gluten/metrics/ScanMetricsUtilSuite.scala
create mode 100644
gluten-ut/spark41/src/test/scala/org/apache/spark/sql/gluten/GlutenRowBasedChecksumSuite.scala
copy
backends-clickhouse/src-celeborn/main/scala/org/apache/spark/shuffle/CHCelebornColumnarBatchSerializerFactory.scala
=>
shims/spark33/src/main/scala/org/apache/spark/shuffle/GlutenMapStatusUtil.scala
(69%)
copy
backends-clickhouse/src-celeborn/main/scala/org/apache/spark/shuffle/CHCelebornColumnarBatchSerializerFactory.scala
=>
shims/spark34/src/main/scala/org/apache/spark/shuffle/GlutenMapStatusUtil.scala
(69%)
copy
backends-clickhouse/src-celeborn/main/scala/org/apache/spark/shuffle/CHCelebornColumnarBatchSerializerFactory.scala
=>
shims/spark35/src/main/scala/org/apache/spark/shuffle/GlutenMapStatusUtil.scala
(69%)
copy
backends-clickhouse/src-celeborn/main/scala/org/apache/spark/shuffle/CHCelebornColumnarBatchSerializerFactory.scala
=>
shims/spark40/src/main/scala/org/apache/spark/shuffle/GlutenMapStatusUtil.scala
(69%)
copy
shims/{spark33/src/main/scala/org/apache/spark/sql/catalyst/expressions/EvalMode.scala
=> spark41/src/main/scala/org/apache/spark/shuffle/GlutenMapStatusUtil.scala}
(60%)
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]