Andrew Palumbo created MAHOUT-1815:
--------------------------------------
Summary: dsqDist(X,Y) and dsqDist(X) failing in flink tests.
Key: MAHOUT-1815
URL: https://issues.apache.org/jira/browse/MAHOUT-1815
Project: Mahout
Issue Type: Bug
Reporter: Andrew Palumbo
Priority: Blocker
{code}
test("dsqDist(X,Y)") {
val m = 100
val n = 300
val d = 7
val mxX = Matrices.symmetricUniformView(m, d, 12345).cloned -= 5
val mxY = Matrices.symmetricUniformView(n, d, 1234).cloned += 10
val (drmX, drmY) = (drmParallelize(mxX, 3), drmParallelize(mxY, 4))
val mxDsq = dsqDist(drmX, drmY).collect
val mxDsqControl = new DenseMatrix(m, n) := { (r, c, _) ⇒ (mxX(r, ::) -
mxY(c, ::)) ^= 2 sum }
(mxDsq - mxDsqControl).norm should be < 1e-7
}
{code}
And
{code}
test("dsqDist(X)") {
val m = 100
val d = 7
val mxX = Matrices.symmetricUniformView(m, d, 12345).cloned -= 5
val drmX = drmParallelize(mxX, 3)
val mxDsq = dsqDist(drmX).collect
val mxDsqControl = sqDist(drmX)
(mxDsq - mxDsqControl).norm should be < 1e-7
}
{code}
are both failing in the Flink tests with {{java.lang.ArrayIndexOutOfBoundsException}}:
{code}
03/15/2016 17:02:19 DataSink
(org.apache.flink.api.java.Utils$CollectHelper@568b43ab)(5/10) switched to
FINISHED
1 [CHAIN GroupReduce (GroupReduce at
org.apache.mahout.flinkbindings.blas.FlinkOpAtB$.notZippable(FlinkOpAtB.scala:78))
-> Map (Map at
org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$.apply(FlinkOpMapBlock.scala:37))
-> FlatMap (FlatMap at
org.apache.mahout.flinkbindings.drm.BlockifiedFlinkDrm.asRowWise(FlinkDrm.scala:93))
(8/10)] ERROR org.apache.flink.runtime.operators.BatchTask - Error in task
code: CHAIN GroupReduce (GroupReduce at
org.apache.mahout.flinkbindings.blas.FlinkOpAtB$.notZippable(FlinkOpAtB.scala:78))
-> Map (Map at
org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$.apply(FlinkOpMapBlock.scala:37))
-> FlatMap (FlatMap at
org.apache.mahout.flinkbindings.drm.BlockifiedFlinkDrm.asRowWise(FlinkDrm.scala:93))
(8/10)
java.lang.ArrayIndexOutOfBoundsException: 5
at
org.apache.mahout.math.drm.package$$anonfun$4$$anonfun$apply$3.apply(package.scala:317)
at
org.apache.mahout.math.drm.package$$anonfun$4$$anonfun$apply$3.apply(package.scala:317)
at
org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3$$anonfun$apply$2.apply(MatrixOps.scala:164)
at
org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3$$anonfun$apply$2.apply(MatrixOps.scala:164)
at scala.collection.Iterator$class.foreach(Iterator.scala:727)
at scala.collection.AbstractIterator.foreach(Iterator.scala:1157)
at scala.collection.IterableLike$class.foreach(IterableLike.scala:72)
at scala.collection.AbstractIterable.foreach(Iterable.scala:54)
at
org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3.apply(MatrixOps.scala:164)
at
org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3.apply(MatrixOps.scala:164)
at scala.collection.Iterator$class.foreach(Iterator.scala:727)
at scala.collection.AbstractIterator.foreach(Iterator.scala:1157)
at scala.collection.IterableLike$class.foreach(IterableLike.scala:72)
at scala.collection.AbstractIterable.foreach(Iterable.scala:54)
at
org.apache.mahout.math.scalabindings.MatrixOps.$colon$eq(MatrixOps.scala:164)
at
org.apache.mahout.math.drm.package$$anonfun$4.apply(package.scala:317)
at
org.apache.mahout.math.drm.package$$anonfun$4.apply(package.scala:311)
at
org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$$anonfun$1.apply(FlinkOpMapBlock.scala:39)
at
org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$$anonfun$1.apply(FlinkOpMapBlock.scala:38)
at org.apache.flink.api.scala.DataSet$$anon$1.map(DataSet.scala:297)
at
org.apache.flink.runtime.operators.chaining.ChainedMapDriver.collect(ChainedMapDriver.java:78)
at
org.apache.mahout.flinkbindings.blas.FlinkOpAtB$$anon$6.reduce(FlinkOpAtB.scala:86)
at
org.apache.flink.runtime.operators.GroupReduceDriver.run(GroupReduceDriver.java:125)
at org.apache.flink.runtime.operators.BatchTask.run(BatchTask.java:480)
at
org.apache.flink.runtime.operators.BatchTask.invoke(BatchTask.java:345)
at org.apache.flink.runtime.taskmanager.Task.run(Task.java:559)
at java.lang.Thread.run(Thread.java:745)
{code}
--
This message was sent by Atlassian JIRA
(v6.3.4#6332)