This is an automated email from the ASF dual-hosted git repository.

zhouyuan pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/gluten.git


The following commit(s) were added to refs/heads/main by this push:
     new e733332184 [GLUTEN-6887][VL] Daily Update Velox Version (2026_05_18) (#12102)
e733332184 is described below

commit e733332184fa2e0fe85f29c5384b8d5210ca972e
Author: Gluten Performance Bot <[email protected]>
AuthorDate: Fri May 22 07:56:12 2026 +0100

    [GLUTEN-6887][VL] Daily Update Velox Version (2026_05_18) (#12102)
    
    * [GLUTEN-6887][VL] Daily Update Velox Version (dft-2026_05_18)
    
    Upstream Velox's New Commits:
    6af674c38 by Claude, feat(fuzzer): Add WindowNode-based alternate plan to TopNRowNumberFuzzer (#17536)
    bec8806bf by 1fanwang, fix(parquet): Include file column name in schema-mismatch error (#16591) (#17353)
    103b8c889 by Shaojie Li, fix(cudf): Show stats for adapter operators not in plan tree (#17541)
    81dff12ad by Suryadev Sahadevan Rajesh, refactor(encoding): Move encoding selection files to `selection/` subfolder (#17540)
    472d3196b by beliefer, fix: Pass request type to SelectiveDecimalColumnReader (#17463)
    fb0826ace by Masha Basmanova, docs: Add PR review scripts and style guide (#17524)
    d41a22889 by Xiao Du, refactor: Enforce callers to provide metadataIoStats to TabletReader (#17534)
    951677f88 by Shruti Shivakumar, refactor(cudf): Alphabetize objects in Velox-cuDF CMake files (#17517)
    1718279d7 by Krishna Pai, build(docker): Pin tzdata across all velox-dev images (#17535)
    2a5e3f905 by Shrinidhi Joshi, fix: Drop HashTable cache entry on builder failure (#17527)
    982637f85 by Masha Basmanova, feat: Support dialect-specific type coercion (#17519)
    ea683f05a by Chengcheng Jin, fix(cudf): Fix CudfSplitReader ReaderOptions init (#17532)
    8801a43ff by Scott Lee, Add reallocateBytes to MemoryAllocator to avoid unnecessary memcpy (#17525)
    a983d9b07 by Madhurendra Purbay, perf(simd): Add arch-aware boolean mask helpers (#17257)
    2cea959b7 by rexan, feat: Add support for TZDIR environment variable (#15871)
    02f22e8ac by Raymond Lin, feat: Add partition key propagation to ScanBatchEvent callback (#17513)
    53b6a8b03 by Huameng (Michael) Jiang, fix(tracer): Fix TableWrite trace replayer to register connector and preserve serde parameters (#17526)
    5680a3226 by Xiaoxuan Meng, Refactor ReaderOptions IoStatistics from raw pointers to shared_ptr (#17518)
    fd130f44a by mohsaka, feat: Add iceberg data file statistics (#17388)
    805db6b72 by Pramod Satya, fix: Validate reduce_agg initial state (#17398)
    6af81f0e7 by Shaojie Li, perf(hashtable): Add adaptive prefetch to hashRows normalizedKey path (#17495)
    78ebafc59 by Rui Mo, fix(spark): Remove TIMESTAMP_NTZ type (#17512)
    6800d5ba1 by mohsaka, feat: Add FileMetadata return to Writer::close() and introduce WriterConfig constants (#17509)
    888bab856 by Orri Erling, feat(wave): Add durable kernel caching infrastructure to wave/common (#17474)
    d0a53253c by Facebook GitHub Bot, Re-sync with internal repository
    
    Signed-off-by: glutenperfbot <[email protected]>
    
    * Trigger CI
    
    * Trigger PR CI
    
    Signed-off-by: Reema Alzaid <[email protected]>
    
    * Fix Velox API compatibility
    
    * Trigger PR CI
    
    Signed-off-by: Reema Alzaid <[email protected]>
    
    * Trigger CI for IBM Velox 2026-05-18 fix
    
    * Trigger CI for IBM Velox 2026-05-18 fix
    
    * [VL][Iceberg] Propagate VELOX_ENABLE_PARQUET to Gluten backend
    
    ---------
    
    Signed-off-by: glutenperfbot <[email protected]>
    Signed-off-by: Reema Alzaid <[email protected]>
    Co-authored-by: glutenperfbot <[email protected]>
    Co-authored-by: Reema Alzaid <[email protected]>
---
 cpp/velox/CMakeLists.txt                             | 12 ++++++++++++
 cpp/velox/substrait/SubstraitToVeloxPlanValidator.cc |  3 ++-
 cpp/velox/utils/ConfigExtractor.cc                   |  6 +++---
 ep/build-velox/src/get-velox.sh                      |  4 ++--
 4 files changed, 19 insertions(+), 6 deletions(-)

diff --git a/cpp/velox/CMakeLists.txt b/cpp/velox/CMakeLists.txt
index 532dd6e6a7..a8b0d668ca 100644
--- a/cpp/velox/CMakeLists.txt
+++ b/cpp/velox/CMakeLists.txt
@@ -239,6 +239,18 @@ endif()
 
 add_library(velox SHARED ${VELOX_SRCS})
 
+# Keep ABI sensitive Velox feature macros in sync
+set(GLUTEN_VELOX_CMAKE_CACHE "${VELOX_BUILD_PATH}/CMakeCache.txt")
+set(GLUTEN_VELOX_ENABLE_PARQUET ${VELOX_ENABLE_PARQUET})
+if(NOT GLUTEN_VELOX_ENABLE_PARQUET AND EXISTS "${GLUTEN_VELOX_CMAKE_CACHE}")
+  file(STRINGS "${GLUTEN_VELOX_CMAKE_CACHE}" GLUTEN_VELOX_ENABLE_PARQUET
+       REGEX "^VELOX_ENABLE_PARQUET:BOOL=(ON|TRUE|1)$")
+endif()
+if(GLUTEN_VELOX_ENABLE_PARQUET)
+  target_compile_definitions(velox PRIVATE VELOX_ENABLE_PARQUET)
+  message(STATUS "Propagating VELOX_ENABLE_PARQUET to Gluten Velox backend")
+endif()
+
 if(ENABLE_GLUTEN_VCPKG AND NOT CMAKE_SYSTEM_NAME MATCHES "Darwin")
   # Hide some symbols to avoid conflict.
   target_link_options(
diff --git a/cpp/velox/substrait/SubstraitToVeloxPlanValidator.cc b/cpp/velox/substrait/SubstraitToVeloxPlanValidator.cc
index 6b10b805ed..3ea800b60c 100644
--- a/cpp/velox/substrait/SubstraitToVeloxPlanValidator.cc
+++ b/cpp/velox/substrait/SubstraitToVeloxPlanValidator.cc
@@ -25,6 +25,7 @@
 #include "velox/exec/Aggregate.h"
 #include "velox/expression/Expr.h"
 #include "velox/expression/SignatureBinder.h"
+#include "velox/type/TypeCoercer.h"
 
 namespace gluten {
 namespace {
@@ -1159,7 +1160,7 @@ bool SubstraitToVeloxPlanValidator::validateAggRelFunctionType(const ::substrait
 
     bool resolved = false;
     for (const auto& signature : signaturesOpt.value()) {
-      exec::SignatureBinder binder(*signature, types);
+      exec::SignatureBinder binder(*signature, types, facebook::velox::TypeCoercer::defaults());
       if (binder.tryBind()) {
         TypePtr resolveType = nullptr;
         try {
diff --git a/cpp/velox/utils/ConfigExtractor.cc b/cpp/velox/utils/ConfigExtractor.cc
index 6006d990db..b0b6c1a99a 100644
--- a/cpp/velox/utils/ConfigExtractor.cc
+++ b/cpp/velox/utils/ConfigExtractor.cc
@@ -25,7 +25,7 @@
 #include "utils/Macros.h"
 #include "velox/connectors/hive/HiveConfig.h"
 #include "velox/connectors/hive/storage_adapters/s3fs/S3Config.h"
-#include "velox/dwio/parquet/writer/Writer.h"
+#include "velox/dwio/parquet/writer/WriterConfig.h"
 
 namespace gluten {
 
@@ -229,7 +229,7 @@ std::shared_ptr<facebook::velox::config::ConfigBase> createHiveConnectorSessionC
   configs[facebook::velox::connector::hive::HiveConfig::kFileColumnNamesReadAsLowerCaseSession] =
       !conf->get<bool>(kCaseSensitive, false) ? "true" : "false";
   configs[facebook::velox::connector::hive::HiveConfig::kPartitionPathAsLowerCaseSession] = "false";
-  configs[facebook::velox::parquet::WriterOptions::kParquetWriteTimestampUnit] = std::string("6");
+  configs[facebook::velox::parquet::WriterConfig::kParquetSessionWriteTimestampUnit] = std::string("6");
   configs[facebook::velox::connector::hive::HiveConfig::kReadTimestampUnitSession] = std::string("6");
   configs[facebook::velox::connector::hive::HiveConfig::kMaxPartitionsPerWritersSession] =
       conf->get<std::string>(kMaxPartitions, "10000");
@@ -243,7 +243,7 @@ std::shared_ptr<facebook::velox::config::ConfigBase> createHiveConnectorSessionC
       conf->get<bool>(kAllowInt32Narrowing, true) ? "true" : "false";
   configs[facebook::velox::connector::hive::HiveConfig::kOrcUseColumnNamesSession] =
       conf->get<bool>(kOrcUseColumnNames, true) ? "true" : "false";
-  configs[facebook::velox::parquet::WriterOptions::kParquetWritePageSize] =
+  configs[facebook::velox::parquet::WriterConfig::kParquetSessionWritePageSize] =
       conf->get<std::string>(kWriteParquetPageSizeBytes, "1MB");
 
   overwriteVeloxConf(conf.get(), configs, kDynamicBackendConfPrefix);
diff --git a/ep/build-velox/src/get-velox.sh b/ep/build-velox/src/get-velox.sh
index a6631e1e76..51034c77f7 100755
--- a/ep/build-velox/src/get-velox.sh
+++ b/ep/build-velox/src/get-velox.sh
@@ -18,8 +18,8 @@ set -exu
 
 CURRENT_DIR=$(cd "$(dirname "$BASH_SOURCE")"; pwd)
 VELOX_REPO=https://github.com/IBM/velox.git
-VELOX_BRANCH=dft-2026_05_15
-VELOX_ENHANCED_BRANCH=ibm-2026_05_15
+VELOX_BRANCH=dft-2026_05_18
+VELOX_ENHANCED_BRANCH=ibm-2026_05_18
 VELOX_HOME=""
 RUN_SETUP_SCRIPT=ON
 ENABLE_ENHANCED_FEATURES=OFF


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to