Github user gatorsmile commented on a diff in the pull request:

    https://github.com/apache/spark/pull/21052#discussion_r183219812
  
    --- Diff: sql/core/src/test/scala/org/apache/spark/sql/StatisticsCollectionSuite.scala ---
    @@ -382,4 +382,32 @@ class StatisticsCollectionSuite extends StatisticsCollectionTestBase with Shared
           }
         }
       }
    +
    +  test("Simple queries must be working, if CBO is turned on") {
    +    withSQLConf(SQLConf.CBO_ENABLED.key -> "true") {
    +      withTable("TBL1", "TBL") {
    +        import org.apache.spark.sql.functions._
    +        val df = spark.range(1000L).select('id,
    +          'id * 2 as "FLD1",
    +          'id * 12 as "FLD2",
    +          lit("aaa") + 'id as "fld3")
    +        df.write
    +          .mode(SaveMode.Overwrite)
    +          .bucketBy(10, "id", "FLD1", "FLD2")
    +          .sortBy("id", "FLD1", "FLD2")
    +          .saveAsTable("TBL")
    +        sql("ANALYZE TABLE TBL COMPUTE STATISTICS ")
    +        sql("ANALYZE TABLE TBL COMPUTE STATISTICS FOR COLUMNS ID, FLD1, 
FLD2, FLD3")
    +        val df2 = spark.sql(
    +          """
    +             SELECT t1.id, t1.fld1, t1.fld2, t1.fld3
    +             FROM tbl t1
    +             JOIN tbl t2 on t1.id=t2.id
    +             WHERE  t1.fld3 IN (-123.23,321.23)
    +          """.stripMargin)
    --- End diff --
    
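    Nit: `stripMargin` only strips leading whitespace up to a `|` margin character, so without `|` at the start of each line the call has no effect. Please prefix each line of the query with `|`: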
    ```Scala
              """
                |SELECT t1.id, t1.fld1, t1.fld2, t1.fld3
                |FROM tbl t1
                |JOIN tbl t2 on t1.id=t2.id
                |WHERE  t1.fld3 IN (-123.23,321.23)
              """.stripMargin)
    ```


---

---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to