Github user WeichenXu123 commented on a diff in the pull request:

    https://github.com/apache/spark/pull/20686#discussion_r171546765
  
    --- Diff: mllib/src/test/scala/org/apache/spark/ml/feature/QuantileDiscretizerSuite.scala ---
    @@ -364,18 +419,47 @@ class QuantileDiscretizerSuite
           .setOutputCols(Array("result1", "result2", "result3"))
           .setNumBucketsArray(Array(10, 10, 10))
     
    -    val result1 = discretizerSingleNumBuckets.fit(df).transform(df)
    -      .select("result1", "result2", "result3")
    -      .collect()
    -    val result2 = discretizerNumBucketsArray.fit(df).transform(df)
    -      .select("result1", "result2", "result3")
    +    val expected = Seq(
    +      (0.0, 0.0, 0.0),
    +      (1.0, 1.0, 1.0),
    +      (1.0, 1.0, 1.0),
    +      (2.0, 2.0, 2.0),
    +      (2.0, 2.0, 2.0),
    +      (2.0, 2.0, 2.0),
    +      (3.0, 3.0, 3.0),
    +      (4.0, 4.0, 4.0),
    +      (4.0, 4.0, 4.0),
    +      (5.0, 5.0, 5.0),
    +      (5.0, 5.0, 5.0),
    +      (5.0, 5.0, 5.0),
    +      (6.0, 6.0, 6.0),
    +      (6.0, 6.0, 6.0),
    +      (7.0, 7.0, 7.0),
    +      (8.0, 8.0, 8.0),
    +      (8.0, 8.0, 8.0),
    +      (9.0, 9.0, 9.0),
    +      (9.0, 9.0, 9.0),
    +      (9.0, 9.0, 9.0)
    +    ).toDF("result1", "result2", "result3")
    --- End diff --
    
    ditto.


---

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscribe@spark.apache.org
For additional commands, e-mail: reviews-help@spark.apache.org

Reply via email to