This is an automated email from the ASF dual-hosted git repository.

hongze pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/incubator-gluten.git


The following commit(s) were added to refs/heads/main by this push:
     new da5259566 [VL] Add tests for Velox SMJ's coverage (#7195)
da5259566 is described below

commit da525956635d3c06d3a715a27b4b199912f23d84
Author: Hongze Zhang <[email protected]>
AuthorDate: Thu Sep 12 09:24:35 2024 +0800

    [VL] Add tests for Velox SMJ's coverage (#7195)
---
 .../utils/clickhouse/ClickHouseTestSettings.scala       |  6 +++---
 .../apache/gluten/utils/velox/VeloxTestSettings.scala   | 13 ++++++++++---
 .../sql/execution/joins/GlutenInnerJoinSuite.scala      | 17 ++++++++++++++++-
 .../sql/execution/joins/GlutenOuterJoinSuite.scala      | 17 ++++++++++++++++-
 4 files changed, 45 insertions(+), 8 deletions(-)

diff --git 
a/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/clickhouse/ClickHouseTestSettings.scala
 
b/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/clickhouse/ClickHouseTestSettings.scala
index 7e73ae9c1..77d4cb1ce 100644
--- 
a/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/clickhouse/ClickHouseTestSettings.scala
+++ 
b/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/clickhouse/ClickHouseTestSettings.scala
@@ -34,7 +34,7 @@ import org.apache.spark.sql.execution.datasources.parquet._
 import org.apache.spark.sql.execution.datasources.text.{GlutenTextV1Suite, 
GlutenTextV2Suite}
 import 
org.apache.spark.sql.execution.datasources.v2.{GlutenDataSourceV2StrategySuite, 
GlutenFileTableSuite, GlutenV2PredicateSuite}
 import org.apache.spark.sql.execution.exchange.GlutenEnsureRequirementsSuite
-import org.apache.spark.sql.execution.joins.{GlutenBroadcastJoinSuite, 
GlutenExistenceJoinSuite, GlutenInnerJoinSuite, GlutenOuterJoinSuite}
+import org.apache.spark.sql.execution.joins.{GlutenBroadcastJoinSuite, 
GlutenExistenceJoinSuite, GlutenInnerJoinSuiteForceShjOn, 
GlutenOuterJoinSuiteForceShjOn}
 import org.apache.spark.sql.extension.{GlutenCustomerExtensionSuite, 
GlutenSessionExtensionSuite}
 import org.apache.spark.sql.gluten.GlutenFallbackSuite
 import org.apache.spark.sql.hive.execution.GlutenHiveSQLQueryCHSuite
@@ -1624,7 +1624,7 @@ class ClickHouseTestSettings extends BackendTestSettings {
     .exclude("test composed unique condition (both non-equal) for left anti 
join using ShuffledHashJoin (whole-stage-codegen on)")
     .exclude("test composed unique condition (both non-equal) for left anti 
join using SortMergeJoin (whole-stage-codegen off)")
     .exclude("test composed unique condition (both non-equal) for left anti 
join using SortMergeJoin (whole-stage-codegen on)")
-  enableSuite[GlutenInnerJoinSuite]
+  enableSuite[GlutenInnerJoinSuiteForceShjOn]
     .exclude(
       "inner join, one match per row using ShuffledHashJoin (build=left) 
(whole-stage-codegen off)")
     .exclude(
@@ -1673,7 +1673,7 @@ class ClickHouseTestSettings extends BackendTestSettings {
     .exclude("SPARK-15822 - test structs as keys using BroadcastNestedLoopJoin 
build left (whole-stage-codegen on)")
     .exclude("SPARK-15822 - test structs as keys using BroadcastNestedLoopJoin 
build right (whole-stage-codegen off)")
     .exclude("SPARK-15822 - test structs as keys using BroadcastNestedLoopJoin 
build right (whole-stage-codegen on)")
-  enableSuite[GlutenOuterJoinSuite]
+  enableSuite[GlutenOuterJoinSuiteForceShjOn]
     .exclude("basic left outer join using ShuffledHashJoin 
(whole-stage-codegen off)")
     .exclude("basic left outer join using ShuffledHashJoin 
(whole-stage-codegen on)")
     .exclude("basic left outer join using SortMergeJoin (whole-stage-codegen 
off)")
diff --git 
a/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
 
b/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index baabff3f7..e4706caa7 100644
--- 
a/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ 
b/gluten-ut/spark35/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -35,7 +35,7 @@ import org.apache.spark.sql.execution.datasources.parquet._
 import org.apache.spark.sql.execution.datasources.text.{GlutenTextV1Suite, 
GlutenTextV2Suite}
 import 
org.apache.spark.sql.execution.datasources.v2.{GlutenDataSourceV2StrategySuite, 
GlutenFileTableSuite, GlutenV2PredicateSuite}
 import org.apache.spark.sql.execution.exchange.GlutenEnsureRequirementsSuite
-import org.apache.spark.sql.execution.joins.{GlutenBroadcastJoinSuite, 
GlutenExistenceJoinSuite, GlutenInnerJoinSuite, GlutenOuterJoinSuite}
+import org.apache.spark.sql.execution.joins._
 import 
org.apache.spark.sql.extension.{GlutenCollapseProjectExecTransformerSuite, 
GlutenSessionExtensionSuite, TestFileSourceScanExecTransformer}
 import org.apache.spark.sql.gluten.GlutenFallbackSuite
 import org.apache.spark.sql.hive.execution.GlutenHiveSQLQuerySuite
@@ -879,8 +879,15 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("broadcast join where streamed side's output partitioning is 
HashPartitioning")
 
   enableSuite[GlutenExistenceJoinSuite]
-  enableSuite[GlutenInnerJoinSuite]
-  enableSuite[GlutenOuterJoinSuite]
+  enableSuite[GlutenInnerJoinSuiteForceShjOn]
+  enableSuite[GlutenInnerJoinSuiteForceShjOff]
+  enableSuite[GlutenOuterJoinSuiteForceShjOn]
+  enableSuite[GlutenOuterJoinSuiteForceShjOff]
+    // Caused by Velox SMJ result mismatches with Spark.
+    .exclude("basic right outer join using SortMergeJoin (whole-stage-codegen 
off)")
+    .exclude("basic right outer join using SortMergeJoin (whole-stage-codegen 
on)")
+    .exclude("right outer join with unique keys using SortMergeJoin 
(whole-stage-codegen off)")
+    .exclude("right outer join with unique keys using SortMergeJoin 
(whole-stage-codegen on)")
   enableSuite[FallbackStrategiesSuite]
   enableSuite[GlutenBroadcastExchangeSuite]
   enableSuite[GlutenLocalBroadcastExchangeSuite]
diff --git 
a/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenInnerJoinSuite.scala
 
b/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenInnerJoinSuite.scala
index 745f550ae..d31936211 100644
--- 
a/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenInnerJoinSuite.scala
+++ 
b/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenInnerJoinSuite.scala
@@ -16,6 +16,21 @@
  */
 package org.apache.spark.sql.execution.joins
 
+import org.apache.gluten.GlutenConfig
+
+import org.apache.spark.SparkConf
 import org.apache.spark.sql.GlutenSQLTestsBaseTrait
 
-class GlutenInnerJoinSuite extends InnerJoinSuite with GlutenSQLTestsBaseTrait 
{}
+class GlutenInnerJoinSuiteForceShjOn extends InnerJoinSuite with 
GlutenSQLTestsBaseTrait {
+  override def sparkConf: SparkConf = {
+    super.sparkConf
+      .set(GlutenConfig.COLUMNAR_FPRCE_SHUFFLED_HASH_JOIN_ENABLED.key, "true")
+  }
+}
+
+class GlutenInnerJoinSuiteForceShjOff extends InnerJoinSuite with 
GlutenSQLTestsBaseTrait {
+  override def sparkConf: SparkConf = {
+    super.sparkConf
+      .set(GlutenConfig.COLUMNAR_FPRCE_SHUFFLED_HASH_JOIN_ENABLED.key, "false")
+  }
+}
diff --git 
a/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenOuterJoinSuite.scala
 
b/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenOuterJoinSuite.scala
index c915c7369..9c45eae15 100644
--- 
a/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenOuterJoinSuite.scala
+++ 
b/gluten-ut/spark35/src/test/scala/org/apache/spark/sql/execution/joins/GlutenOuterJoinSuite.scala
@@ -16,6 +16,21 @@
  */
 package org.apache.spark.sql.execution.joins
 
+import org.apache.gluten.GlutenConfig
+
+import org.apache.spark.SparkConf
 import org.apache.spark.sql.GlutenSQLTestsBaseTrait
 
-class GlutenOuterJoinSuite extends OuterJoinSuite with GlutenSQLTestsBaseTrait 
{}
+class GlutenOuterJoinSuiteForceShjOn extends OuterJoinSuite with 
GlutenSQLTestsBaseTrait {
+  override def sparkConf: SparkConf = {
+    super.sparkConf
+      .set(GlutenConfig.COLUMNAR_FPRCE_SHUFFLED_HASH_JOIN_ENABLED.key, "true")
+  }
+}
+
+class GlutenOuterJoinSuiteForceShjOff extends OuterJoinSuite with 
GlutenSQLTestsBaseTrait {
+  override def sparkConf: SparkConf = {
+    super.sparkConf
+      .set(GlutenConfig.COLUMNAR_FPRCE_SHUFFLED_HASH_JOIN_ENABLED.key, "false")
+  }
+}


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to