francis0407 commented on a change in pull request #24563: [SPARK-27359]
[OPTIMIZER] [SQL] Rewrite ArraysOverlap Join
URL: https://github.com/apache/spark/pull/24563#discussion_r285929385
##########
File path:
sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala
##########
@@ -20,13 +20,51 @@ package org.apache.spark.sql.catalyst.optimizer
import scala.annotation.tailrec
import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.analysis._
+import org.apache.spark.sql.catalyst.dsl.expressions._
+import org.apache.spark.sql.catalyst.dsl.plans._
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.planning.ExtractFiltersAndInnerJoins
import org.apache.spark.sql.catalyst.plans._
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.rules._
import org.apache.spark.sql.internal.SQLConf
+
+/**
+ * Replace an expensive array_overlap join with an equivalent equijoin.
+ */
+object RewriteArraysOverlapJoin extends Rule[LogicalPlan] {
+ private def makePrime(p: LogicalPlan, arr: NamedExpression, alias: String) =
{
+ val exploded = Alias(Explode(arr), alias)(explicitMetadata =
Some(arr.metadata))
+ val generate = ExtractGenerator(
Review comment:
Hmm, I couldn't find this method (`ExtractGenerator`) in my IDE. Where is it defined?
----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
For queries about this service, please contact Infrastructure at:
[email protected]
With regards,
Apache Git Services
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]