Github user ludatabricks commented on a diff in the pull request:

    https://github.com/apache/spark/pull/21195#discussion_r186566521
  
    --- Diff: 
mllib/src/test/scala/org/apache/spark/ml/clustering/LDASuite.scala ---
    @@ -323,4 +324,21 @@ class LDASuite extends SparkFunSuite with 
MLlibTestSparkContext with DefaultRead
           assert(model.getOptimizer === optimizer)
         }
       }
    +
    +  test("LDA with Array input") {
    +    def trainAndLogLikelihoodAndPerplexity(dataset: Dataset[_]): (Double, 
Double) = {
    +      val model = new 
LDA().setK(k).setOptimizer("online").setMaxIter(1).setSeed(1).fit(dataset)
    +      (model.logLikelihood(dataset), model.logPerplexity(dataset))
    +    }
    +
    +    val (newDataset, newDatasetD, newDatasetF) = 
MLTestingUtils.generateArrayFeatureDataset(dataset)
    +    val (ll, lp) = trainAndLogLikelihoodAndPerplexity(newDataset)
    --- End diff --
    
    Yes. I want to use this as the base for the comparison after we fix 
SPARK-22210.


---

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscr...@spark.apache.org
For additional commands, e-mail: reviews-h...@spark.apache.org

Reply via email to