[GitHub] spark pull request #22320: [SPARK-25313][SQL]Fix regression in FileFormatWri...

cloud-fan Mon, 03 Sep 2018 08:29:56 -0700

Github user cloud-fan commented on a diff in the pull request:

    https://github.com/apache/spark/pull/22320#discussion_r214722030
  
    --- Diff: sql/core/src/test/scala/org/apache/spark/sql/test/DataFrameReaderWriterSuite.scala ---
    @@ -805,6 +805,81 @@ class DataFrameReaderWriterSuite extends QueryTest with SharedSQLContext with Be
         }
       }
     
    +  test("Insert overwrite table command should output correct schema: 
basic") {
    +    withTable("tbl", "tbl2") {
    +      withView("view1") {
    +        val df = spark.range(10).toDF("id")
    +        df.write.format("parquet").saveAsTable("tbl")
    +        spark.sql("CREATE VIEW view1 AS SELECT id FROM tbl")
    +        spark.sql("CREATE TABLE tbl2(ID long) USING parquet")
    +        spark.sql("INSERT OVERWRITE TABLE tbl2 SELECT ID FROM view1")
    +        val identifier = TableIdentifier("tbl2", Some("default"))
    +        val location = 
spark.sessionState.catalog.getTableMetadata(identifier).location.toString
    +        val expectedSchema = StructType(Seq(StructField("ID", LongType, 
true)))
    +        assert(spark.read.parquet(location).schema == expectedSchema)
    +        checkAnswer(spark.table("tbl2"), df)
    +      }
    +    }
    +  }
    +
    +  test("Insert overwrite table command should output correct schema: 
complex") {
    +    withTable("tbl", "tbl2") {
    +      withView("view1") {
    +        val df = spark.range(10).map(x => (x, x.toInt, 
x.toInt)).toDF("col1", "col2", "col3")
    +        df.write.format("parquet").saveAsTable("tbl")
    +        spark.sql("CREATE VIEW view1 AS SELECT * FROM tbl")
    +        spark.sql("CREATE TABLE tbl2(COL1 long, COL2 int, COL3 int) USING 
parquet PARTITIONED " +
    +          "BY (COL2) CLUSTERED BY (COL3) INTO 3 BUCKETS")
    +        spark.sql("INSERT OVERWRITE TABLE tbl2 SELECT COL1, COL2, COL3 " +
    +          "FROM view1 CLUSTER BY COL3")
    --- End diff --
    
    Is it legal to put `CLUSTER BY` in the INSERT statement?



---

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org
For additional commands, e-mail: reviews-h...@spark.apache.org

[GitHub] spark pull request #22320: [SPARK-25313][SQL]Fix regression in FileFormatWri...

Reply via email to