This is an automated email from the ASF dual-hosted git repository.
changchen pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/incubator-gluten.git
The following commit(s) were added to refs/heads/main by this push:
new 173bbbf3d7 [GLUTEN-11341][CORE] Support Scala 2.13 with IntelliJ IDE (#11342)
173bbbf3d7 is described below
commit 173bbbf3d7c083aea22e0545e50ccef69bba0752
Author: Chang chen <[email protected]>
AuthorDate: Wed Dec 31 08:42:49 2025 +0800
[GLUTEN-11341][CORE] Support Scala 2.13 with IntelliJ IDE (#11342)
* [Scala 2.13][IntelliJ] Remove suppression for lint-multiarg-infix warnings in pom.xml
  see https://github.com/apache/spark/pull/43332
* [Scala 2.13][IntelliJ] Suppress warning for `ContentFile::path`
* [Scala 2.13][IntelliJ] Suppress warning for ContextAwareIterator initialization (see the @nowarn sketch after this list)
* [Scala 2.13][IntelliJ] Refactor to use Symbol for column references to fix the compilation error from the IntelliJ compiler on Scala 2.13: "symbol literal is deprecated; use Symbol("i")" (see the column-reference sketch after this list)
* [Fix] Replace deprecated fileToString with Files.readString for file reading in GlutenSQLQueryTestSuite (see the Files.readString sketch after this list)
  see https://github.com/apache/spark/pull/51911, which removes the fileToString method from the Spark code base
* [Scala 2.13][IntelliJ] Update the Java compiler release version from 8 to `${java.version}` in the Scala 2.13 profile to align it with `maven.compiler.target`
* [Refactor] Replace usage of `Symbol` with `col` for column references to align with Spark API best practices
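
For reference, here is a minimal, self-contained sketch (not part of the diff below; the object name, DataFrame, and column names are illustrative) of the three column-reference styles involved: the symbol literal 'i that Scala 2.13 deprecates, the Symbol("i") spelling, and the col("i") form from org.apache.spark.sql.functions that the later refactor settles on.

  import org.apache.spark.sql.SparkSession
  import org.apache.spark.sql.functions.{col, sum}

  object ColumnRefSketch {
    def main(args: Array[String]): Unit = {
      val spark = SparkSession.builder().master("local[1]").appName("col-ref-sketch").getOrCreate()
      import spark.implicits._
      val df = Seq((1, 2), (1, 3), (2, 4)).toDF("i", "j")

      // Deprecated since Scala 2.13 (the warning the IntelliJ compiler reports):
      // val bySymbolLiteral = df.groupBy('i).agg(sum('j))

      // Intermediate form used by the first refactor: explicit Symbol(...),
      // resolved through the symbolToColumn implicit from spark.implicits._
      val bySymbol = df.groupBy(Symbol("i")).agg(sum(Symbol("j")))

      // Final form used by the second refactor: col(...) from org.apache.spark.sql.functions.
      val byCol = df.groupBy(col("i")).agg(sum(col("j")))

      bySymbol.show()
      byCol.show()
      spark.stop()
    }
  }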
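
The warning suppressions rely on scala.annotation.nowarn. A minimal sketch of the mechanism, with an assumed deprecated method standing in for the ContextAwareIterator / ContentFile::path cases (the real call sites are in the diff below):

  import scala.annotation.nowarn

  object NowarnSketch {
    @deprecated("use newApi instead", "1.0")
    def oldApi(x: Int): Int = x + 1

    // Annotating the enclosing definition (or a local val, as done for
    // contextAwareIterator below) silences only this deprecation warning,
    // instead of widening the global -Wconf filters in pom.xml.
    @nowarn("cat=deprecation")
    def stillNeedsOldApi(x: Int): Int = oldApi(x)

    def main(args: Array[String]): Unit =
      println(stillNeedsOldApi(41))
  }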
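
The fileToString replacement is plain JDK 11+ NIO. A minimal sketch, assuming an arbitrary text file path passed on the command line (the real call sites in GlutenSQLQueryTestSuite are in the diff below):

  import java.io.File
  import java.nio.file.Files

  object ReadStringSketch {
    def main(args: Array[String]): Unit = {
      val file = new File(args(0))

      // Before: fileToString(file), a Spark test helper removed by apache/spark#51911.
      // After: read the whole file as a UTF-8 string with the JDK itself.
      val input = Files.readString(file.toPath)
      println(s"read ${input.length} characters")
    }
  }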
---------
Co-authored-by: Chang chen <[email protected]>
---
.../api/python/ColumnarArrowEvalPythonExec.scala | 3 +-
.../spark/source/GlutenIcebergSourceUtil.scala | 2 +
.../org/apache/spark/GlutenSQLQueryTestSuite.scala | 9 +--
.../sql/connector/GlutenDataSourceV2Suite.scala | 11 ++--
.../ClickHouseAdaptiveQueryExecSuite.scala | 71 +++++++++++-----------
.../velox/VeloxAdaptiveQueryExecSuite.scala | 71 +++++++++++-----------
pom.xml | 3 +-
7 files changed, 90 insertions(+), 80 deletions(-)
diff --git a/backends-velox/src/main/scala/org/apache/spark/api/python/ColumnarArrowEvalPythonExec.scala b/backends-velox/src/main/scala/org/apache/spark/api/python/ColumnarArrowEvalPythonExec.scala
index bfa33a804c..033f8a4284 100644
--- a/backends-velox/src/main/scala/org/apache/spark/api/python/ColumnarArrowEvalPythonExec.scala
+++ b/backends-velox/src/main/scala/org/apache/spark/api/python/ColumnarArrowEvalPythonExec.scala
@@ -43,6 +43,7 @@ import org.apache.arrow.vector.ipc.{ArrowStreamReader, ArrowStreamWriter}
import java.io.{DataInputStream, DataOutputStream}
import java.util.concurrent.atomic.AtomicBoolean
+import scala.annotation.nowarn
import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
@@ -362,7 +363,7 @@ case class ColumnarArrowEvalPythonExec(
StructField(s"_$i", dt)
}.toSeq)
- val contextAwareIterator = new ContextAwareIterator(context, iter)
+ @nowarn val contextAwareIterator = new ContextAwareIterator(context, iter)
val inputCbCache = new ArrayBuffer[ColumnarBatch]()
var start_time: Long = 0
val inputBatchIter = contextAwareIterator.map {
diff --git a/gluten-iceberg/src/main/scala/org/apache/iceberg/spark/source/GlutenIcebergSourceUtil.scala b/gluten-iceberg/src/main/scala/org/apache/iceberg/spark/source/GlutenIcebergSourceUtil.scala
index ebe899f922..f1122280c1 100644
--- a/gluten-iceberg/src/main/scala/org/apache/iceberg/spark/source/GlutenIcebergSourceUtil.scala
+++ b/gluten-iceberg/src/main/scala/org/apache/iceberg/spark/source/GlutenIcebergSourceUtil.scala
@@ -33,6 +33,7 @@ import org.apache.iceberg.spark.SparkSchemaUtil
import java.lang.{Class, Long => JLong}
import java.util.{ArrayList => JArrayList, HashMap => JHashMap, List => JList, Map => JMap}
+import scala.annotation.nowarn
import scala.collection.JavaConverters._
object GlutenIcebergSourceUtil {
@@ -50,6 +51,7 @@ object GlutenIcebergSourceUtil {
}
}
+ @nowarn
def genSplitInfo(
partition: SparkDataSourceRDDPartition,
readPartitionSchema: StructType): SplitInfo = {
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/GlutenSQLQueryTestSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/GlutenSQLQueryTestSuite.scala
index b06901b921..8d1c08c73d 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/GlutenSQLQueryTestSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/GlutenSQLQueryTestSuite.scala
@@ -29,8 +29,8 @@ import org.apache.spark.sql.catalyst.parser.ParseException
import org.apache.spark.sql.catalyst.plans.SQLHelper
import org.apache.spark.sql.catalyst.plans.logical.{Command, LogicalPlan}
import org.apache.spark.sql.catalyst.rules.RuleExecutor
-import org.apache.spark.sql.catalyst.util.{fileToString, stringToFile}
import org.apache.spark.sql.catalyst.util.DateTimeConstants.NANOS_PER_SECOND
+import org.apache.spark.sql.catalyst.util.stringToFile
import org.apache.spark.sql.execution.WholeStageCodegenExec
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.SQLConf.TimestampTypes
@@ -40,6 +40,7 @@ import org.apache.spark.util.Utils
import java.io.File
import java.net.URI
+import java.nio.file.Files
import java.util.Locale
import scala.collection.mutable
@@ -320,7 +321,7 @@ class GlutenSQLQueryTestSuite
newLine.startsWith("--") && !newLine.startsWith("--QUERY-DELIMITER")
}
- val input = fileToString(new File(testCase.inputFile))
+ val input = Files.readString(new File(testCase.inputFile).toPath)
val (comments, code) = splitCommentsAndCodes(input)
@@ -331,7 +332,7 @@ class GlutenSQLQueryTestSuite
testCaseName =>
listTestCases.find(_.name == testCaseName).map {
testCase =>
- val input = fileToString(new File(testCase.inputFile))
+ val input = Files.readString(new File(testCase.inputFile).toPath)
val (_, code) = splitCommentsAndCodes(input)
code
}
@@ -738,7 +739,7 @@ class GlutenSQLQueryTestSuite
makeOutput: (String, Option[String], String) => QueryTestOutput): Unit = {
// Read back the golden file.
val expectedOutputs: Seq[QueryTestOutput] = {
- val goldenOutput = fileToString(new File(resultFile))
+ val goldenOutput = Files.readString(new File(resultFile).toPath)
val segments = goldenOutput.split("-- !query.*\n")
val numSegments = outputs.map(_.numSegments).sum + 1
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/connector/GlutenDataSourceV2Suite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/connector/GlutenDataSourceV2Suite.scala
index 803c407ca8..080487820a 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/connector/GlutenDataSourceV2Suite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/connector/GlutenDataSourceV2Suite.scala
@@ -21,6 +21,7 @@ import org.apache.gluten.execution.SortExecTransformer
import org.apache.spark.sql.{GlutenSQLTestsBaseTrait, Row}
import org.apache.spark.sql.execution.ColumnarShuffleExchangeExec
import org.apache.spark.sql.expressions.Window
+import org.apache.spark.sql.functions.col
import org.apache.spark.sql.functions.row_number
import org.apache.spark.sql.internal.SQLConf
@@ -38,25 +39,25 @@ class GlutenDataSourceV2Suite extends DataSourceV2Suite with GlutenSQLTestsBaseT
val df = spark.read.format(cls.getName).load()
checkAnswer(df, Seq(Row(1, 4), Row(1, 4), Row(3, 6), Row(2, 6), Row(4, 2), Row(4, 2)))
- val groupByColA = df.groupBy('i).agg(sum('j))
+ val groupByColA = df.groupBy(col("i")).agg(sum(col("j")))
checkAnswer(groupByColA, Seq(Row(1, 8), Row(2, 6), Row(3, 6), Row(4, 4)))
assert(collectFirst(groupByColA.queryExecution.executedPlan) {
case e: ColumnarShuffleExchangeExec => e
}.isEmpty)
- val groupByColAB = df.groupBy('i, 'j).agg(count("*"))
+ val groupByColAB = df.groupBy(col("i"), col("j")).agg(count("*"))
checkAnswer(groupByColAB, Seq(Row(1, 4, 2), Row(2, 6, 1), Row(3, 6, 1), Row(4, 2, 2)))
assert(collectFirst(groupByColAB.queryExecution.executedPlan) {
case e: ColumnarShuffleExchangeExec => e
}.isEmpty)
- val groupByColB = df.groupBy('j).agg(sum('i))
+ val groupByColB = df.groupBy(col("j")).agg(sum(col("i")))
checkAnswer(groupByColB, Seq(Row(2, 8), Row(4, 2), Row(6, 5)))
assert(collectFirst(groupByColB.queryExecution.executedPlan) {
case e: ColumnarShuffleExchangeExec => e
}.isDefined)
- val groupByAPlusB = df.groupBy('i + 'j).agg(count("*"))
+ val groupByAPlusB = df.groupBy(col("i") + col("j")).agg(count("*"))
checkAnswer(groupByAPlusB, Seq(Row(5, 2), Row(6, 2), Row(8, 1), Row(9, 1)))
assert(collectFirst(groupByAPlusB.queryExecution.executedPlan) {
case e: ColumnarShuffleExchangeExec => e
@@ -138,7 +139,7 @@ class GlutenDataSourceV2Suite extends DataSourceV2Suite with GlutenSQLTestsBaseT
{
val windowPartByColIOrderByColJ = df.withColumn(
"no",
- row_number().over(Window.partitionBy(Symbol("i")).orderBy(Symbol("j"))))
+ row_number().over(Window.partitionBy(col("i")).orderBy(col("j"))))
checkAnswer(
windowPartByColIOrderByColJ,
Seq(
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/clickhouse/ClickHouseAdaptiveQueryExecSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/clickhouse/ClickHouseAdaptiveQueryExecSuite.scala
index 70e6c81c11..903c7ccd13 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/clickhouse/ClickHouseAdaptiveQueryExecSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/clickhouse/ClickHouseAdaptiveQueryExecSuite.scala
@@ -32,6 +32,7 @@ import org.apache.spark.sql.execution.exchange._
import org.apache.spark.sql.execution.joins.{BaseJoinExec, BroadcastHashJoinExec, ShuffledHashJoinExec, SortMergeJoinExec}
import org.apache.spark.sql.execution.metric.SQLShuffleReadMetricsReporter
import org.apache.spark.sql.execution.ui.SparkListenerSQLAdaptiveExecutionUpdate
+import org.apache.spark.sql.functions.col
import org.apache.spark.sql.functions.when
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.test.SQLTestData.TestData
@@ -254,13 +255,13 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
SQLConf.COALESCE_PARTITIONS_ENABLED.key -> "true",
SQLConf.ADAPTIVE_OPTIMIZER_EXCLUDED_RULES.key ->
AQEPropagateEmptyRelation.ruleName
) {
- val df1 = spark.range(10).withColumn("a", 'id)
- val df2 = spark.range(10).withColumn("b", 'id)
+ val df1 = spark.range(10).withColumn("a", col("id"))
+ val df2 = spark.range(10).withColumn("b", col("id"))
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "-1") {
val testDf = df1
- .where('a > 10)
- .join(df2.where('b > 10), Seq("id"), "left_outer")
- .groupBy('a)
+ .where(col("a") > 10)
+ .join(df2.where(col("b") > 10), Seq("id"), "left_outer")
+ .groupBy(col("a"))
.count()
checkAnswer(testDf, Seq())
val plan = testDf.queryExecution.executedPlan
@@ -269,9 +270,9 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "1") {
val testDf = df1
- .where('a > 10)
- .join(df2.where('b > 10), Seq("id"), "left_outer")
- .groupBy('a)
+ .where(col("a") > 10)
+ .join(df2.where(col("b") > 10), Seq("id"), "left_outer")
+ .groupBy(col("a"))
.count()
checkAnswer(testDf, Seq())
val plan = testDf.queryExecution.executedPlan
@@ -346,8 +347,8 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
// +- ShuffleExchange
// After applied the 'OptimizeShuffleWithLocalRead' rule, we can convert all the four
- // shuffle read to local shuffle read in the bottom two 'BroadcastHashJoin'.
- // For the top level 'BroadcastHashJoin', the probe side is not shuffle query stage
+ // shuffle read to local shuffle read in the bottom two Symbol("b")roadcastHashJoin'.
+ // For the top level Symbol("b")roadcastHashJoin', the probe side is not shuffle query stage
// and the build side shuffle query stage is also converted to local shuffle read.
checkNumLocalShuffleReads(adaptivePlan, 0)
}
@@ -652,19 +653,19 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .when('id >= 750, 1000)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .when(col("id") >= 750, 1000)
+ .otherwise(col("id"))
.as("key1"),
- 'id.as("value1"))
+ col("id").as("value1"))
.createOrReplaceTempView("skewData1")
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .otherwise(col("id"))
.as("key2"),
- 'id.as("value2"))
+ col("id").as("value2"))
.createOrReplaceTempView("skewData2")
def checkSkewJoin(
@@ -780,19 +781,19 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .when('id >= 750, 1000)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .when(col("id") >= 750, 1000)
+ .otherwise(col("id"))
.as("key1"),
- 'id.as("value1"))
+ col("id").as("value1"))
.createOrReplaceTempView("skewData1")
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .otherwise(col("id"))
.as("key2"),
- 'id.as("value2"))
+ col("id").as("value2"))
.createOrReplaceTempView("skewData2")
val (_, adaptivePlan) =
runAdaptiveAndVerifyResult("SELECT * FROM skewData1 join skewData2
ON key1 = key2")
@@ -940,7 +941,7 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "300") {
// Repartition with no partition num specified.
checkBHJ(
- df.repartition('b),
+ df.repartition(col("b")),
// The top shuffle from repartition is optimized out.
optimizeOutRepartition = true,
probeSideLocalRead = false,
@@ -949,7 +950,7 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
// Repartition with default partition num (5 in test env) specified.
checkBHJ(
- df.repartition(5, 'b),
+ df.repartition(5, col("b")),
// The top shuffle from repartition is optimized out
// The final plan must have 5 partitions, no optimization can be made to the probe side.
optimizeOutRepartition = true,
@@ -959,7 +960,7 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
// Repartition with non-default partition num specified.
checkBHJ(
- df.repartition(4, 'b),
+ df.repartition(4, col("b")),
// The top shuffle from repartition is not optimized out
optimizeOutRepartition = false,
probeSideLocalRead = true,
@@ -968,7 +969,7 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
// Repartition by col and project away the partition cols
checkBHJ(
- df.repartition('b).select('key),
+ df.repartition(col("b")).select(col("key")),
// The top shuffle from repartition is not optimized out
optimizeOutRepartition = false,
probeSideLocalRead = true,
@@ -986,15 +987,16 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
) {
// Repartition with no partition num specified.
checkSMJ(
- df.repartition('b),
+ df.repartition(col("b")),
// The top shuffle from repartition is optimized out.
optimizeOutRepartition = true,
optimizeSkewJoin = false,
- coalescedRead = true)
+ coalescedRead = true
+ )
// Repartition with default partition num (5 in test env) specified.
checkSMJ(
- df.repartition(5, 'b),
+ df.repartition(5, col("b")),
// The top shuffle from repartition is optimized out.
// The final plan must have 5 partitions, can't do coalesced read.
optimizeOutRepartition = true,
@@ -1004,15 +1006,16 @@ class ClickHouseAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with Glute
// Repartition with non-default partition num specified.
checkSMJ(
- df.repartition(4, 'b),
+ df.repartition(4, col("b")),
// The top shuffle from repartition is not optimized out.
optimizeOutRepartition = false,
optimizeSkewJoin = true,
- coalescedRead = false)
+ coalescedRead = false
+ )
// Repartition by col and project away the partition cols
checkSMJ(
- df.repartition('b).select('key),
+ df.repartition(col("b")).select(col("key")),
// The top shuffle from repartition is not optimized out.
optimizeOutRepartition = false,
optimizeSkewJoin = true,
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/velox/VeloxAdaptiveQueryExecSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/velox/VeloxAdaptiveQueryExecSuite.scala
index 4be6d072b4..74d2835c4b 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/velox/VeloxAdaptiveQueryExecSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/adaptive/velox/VeloxAdaptiveQueryExecSuite.scala
@@ -32,6 +32,7 @@ import org.apache.spark.sql.execution.exchange._
import org.apache.spark.sql.execution.joins.{BaseJoinExec, BroadcastHashJoinExec, ShuffledHashJoinExec, SortMergeJoinExec}
import org.apache.spark.sql.execution.metric.SQLShuffleReadMetricsReporter
import org.apache.spark.sql.execution.ui.SparkListenerSQLAdaptiveExecutionUpdate
+import org.apache.spark.sql.functions.col
import org.apache.spark.sql.functions.when
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.test.SQLTestData.TestData
@@ -254,13 +255,13 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
SQLConf.COALESCE_PARTITIONS_ENABLED.key -> "true",
SQLConf.ADAPTIVE_OPTIMIZER_EXCLUDED_RULES.key ->
AQEPropagateEmptyRelation.ruleName
) {
- val df1 = spark.range(10).withColumn("a", 'id)
- val df2 = spark.range(10).withColumn("b", 'id)
+ val df1 = spark.range(10).withColumn("a", col("id"))
+ val df2 = spark.range(10).withColumn("b", col("id"))
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "-1") {
val testDf = df1
- .where('a > 10)
- .join(df2.where('b > 10), Seq("id"), "left_outer")
- .groupBy('a)
+ .where(col("a") > 10)
+ .join(df2.where(col("b") > 10), Seq("id"), "left_outer")
+ .groupBy(col("a"))
.count()
checkAnswer(testDf, Seq())
val plan = testDf.queryExecution.executedPlan
@@ -269,9 +270,9 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "1") {
val testDf = df1
- .where('a > 10)
- .join(df2.where('b > 10), Seq("id"), "left_outer")
- .groupBy('a)
+ .where(col("a") > 10)
+ .join(df2.where(col("b") > 10), Seq("id"), "left_outer")
+ .groupBy(col("a"))
.count()
checkAnswer(testDf, Seq())
val plan = testDf.queryExecution.executedPlan
@@ -346,8 +347,8 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
// +- ShuffleExchange
// After applied the 'OptimizeShuffleWithLocalRead' rule, we can convert all the four
- // shuffle read to local shuffle read in the bottom two 'BroadcastHashJoin'.
- // For the top level 'BroadcastHashJoin', the probe side is not shuffle query stage
+ // shuffle read to local shuffle read in the bottom two Symbol("b")roadcastHashJoin'.
+ // For the top level Symbol("b")roadcastHashJoin', the probe side is not shuffle query stage
// and the build side shuffle query stage is also converted to local shuffle read.
checkNumLocalShuffleReads(adaptivePlan, 0)
}
@@ -649,19 +650,19 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .when('id >= 750, 1000)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .when(col("id") >= 750, 1000)
+ .otherwise(col("id"))
.as("key1"),
- 'id.as("value1"))
+ col("id").as("value1"))
.createOrReplaceTempView("skewData1")
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .otherwise(col("id"))
.as("key2"),
- 'id.as("value2"))
+ col("id").as("value2"))
.createOrReplaceTempView("skewData2")
def checkSkewJoin(
@@ -777,19 +778,19 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .when('id >= 750, 1000)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .when(col("id") >= 750, 1000)
+ .otherwise(col("id"))
.as("key1"),
- 'id.as("value1"))
+ col("id").as("value1"))
.createOrReplaceTempView("skewData1")
spark
.range(0, 1000, 1, 10)
.select(
- when('id < 250, 249)
- .otherwise('id)
+ when(col("id") < 250, 249)
+ .otherwise(col("id"))
.as("key2"),
- 'id.as("value2"))
+ col("id").as("value2"))
.createOrReplaceTempView("skewData2")
val (_, adaptivePlan) =
runAdaptiveAndVerifyResult("SELECT * FROM skewData1 join skewData2
ON key1 = key2")
@@ -922,7 +923,7 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
withSQLConf(SQLConf.AUTO_BROADCASTJOIN_THRESHOLD.key -> "300") {
// Repartition with no partition num specified.
checkBHJ(
- df.repartition('b),
+ df.repartition(col("b")),
// The top shuffle from repartition is optimized out.
optimizeOutRepartition = true,
probeSideLocalRead = false,
@@ -931,7 +932,7 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
// Repartition with default partition num (5 in test env) specified.
checkBHJ(
- df.repartition(5, 'b),
+ df.repartition(5, col("b")),
// The top shuffle from repartition is optimized out
// The final plan must have 5 partitions, no optimization can be made to the probe side.
optimizeOutRepartition = true,
@@ -941,7 +942,7 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
// Repartition with non-default partition num specified.
checkBHJ(
- df.repartition(4, 'b),
+ df.repartition(4, col("b")),
// The top shuffle from repartition is not optimized out
optimizeOutRepartition = false,
probeSideLocalRead = true,
@@ -950,7 +951,7 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
// Repartition by col and project away the partition cols
checkBHJ(
- df.repartition('b).select('key),
+ df.repartition(col("b")).select(col("key")),
// The top shuffle from repartition is not optimized out
optimizeOutRepartition = false,
probeSideLocalRead = true,
@@ -968,15 +969,16 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
) {
// Repartition with no partition num specified.
checkSMJ(
- df.repartition('b),
+ df.repartition(col("b")),
// The top shuffle from repartition is optimized out.
optimizeOutRepartition = true,
optimizeSkewJoin = false,
- coalescedRead = true)
+ coalescedRead = true
+ )
// Repartition with default partition num (5 in test env) specified.
checkSMJ(
- df.repartition(5, 'b),
+ df.repartition(5, col("b")),
// The top shuffle from repartition is optimized out.
// The final plan must have 5 partitions, can't do coalesced read.
optimizeOutRepartition = true,
@@ -986,15 +988,16 @@ class VeloxAdaptiveQueryExecSuite extends AdaptiveQueryExecSuite with GlutenSQLT
// Repartition with non-default partition num specified.
checkSMJ(
- df.repartition(4, 'b),
+ df.repartition(4, col("b")),
// The top shuffle from repartition is not optimized out.
optimizeOutRepartition = false,
optimizeSkewJoin = true,
- coalescedRead = false)
+ coalescedRead = false
+ )
// Repartition by col and project away the partition cols
checkSMJ(
- df.repartition('b).select('key),
+ df.repartition(col("b")).select(col("key")),
// The top shuffle from repartition is not optimized out.
optimizeOutRepartition = false,
optimizeSkewJoin = true,
diff --git a/pom.xml b/pom.xml
index 1d13dc5747..c87d46ceb5 100644
--- a/pom.xml
+++ b/pom.xml
@@ -969,14 +969,13 @@
<arg>-deprecation</arg>
<arg>-feature</arg>
<arg>-explaintypes</arg>
- <arg>-release:8</arg>
+ <arg>-release:${java.version}</arg>
<arg>-Wconf:cat=deprecation:wv,any:e</arg>
<arg>-Wunused:imports</arg>
<!--
TODO(SPARK-33805): Undo the corresponding deprecated usage suppression rule after fixed
-->
<arg>-Wconf:cat=scaladoc:wv</arg>
- <arg>-Wconf:cat=lint-multiarg-infix:wv</arg>
<arg>-Wconf:cat=other-nullary-override:wv</arg>
<!--
SPARK-33775 Suppress compilation warnings that contain the following contents.
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]