[
https://issues.apache.org/jira/browse/MAHOUT-1815?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15200531#comment-15200531
]
Andrew Palumbo edited comment on MAHOUT-1815 at 3/17/16 10:35 PM:
------------------------------------------------------------------
merged to apache/flink-binding
was (Author: andrew_palumbo):
merged to flinl-binding
> dsqDist(X,Y) and dsqDist(X) failing in flink tests.
> ---------------------------------------------------
>
> Key: MAHOUT-1815
> URL: https://issues.apache.org/jira/browse/MAHOUT-1815
> Project: Mahout
> Issue Type: Bug
> Reporter: Andrew Palumbo
> Assignee: Andrew Palumbo
> Priority: Blocker
>
> {code}
> test("dsqDist(X,Y)") {
> val m = 100
> val n = 300
> val d = 7
> val mxX = Matrices.symmetricUniformView(m, d, 12345).cloned -= 5
> val mxY = Matrices.symmetricUniformView(n, d, 1234).cloned += 10
> val (drmX, drmY) = (drmParallelize(mxX, 3), drmParallelize(mxY, 4))
> val mxDsq = dsqDist(drmX, drmY).collect
> val mxDsqControl = new DenseMatrix(m, n) := { (r, c, _) ⇒ (mxX(r, ::) -
> mxY(c, ::)) ^= 2 sum }
> (mxDsq - mxDsqControl).norm should be < 1e-7
> }
> {code}
> And
> {code}
> test("dsqDist(X)") {
> val m = 100
> val d = 7
> val mxX = Matrices.symmetricUniformView(m, d, 12345).cloned -= 5
> val drmX = drmParallelize(mxX, 3)
> val mxDsq = dsqDist(drmX).collect
> val mxDsqControl = sqDist(drmX)
> (mxDsq - mxDsqControl).norm should be < 1e-7
> }
> {code}
> are both failing in the Flink tests with {{java.lang.ArrayIndexOutOfBoundsException}}:
> {code}
> 03/15/2016 17:02:19 DataSink
> (org.apache.flink.api.java.Utils$CollectHelper@568b43ab)(5/10) switched to
> FINISHED
> 1 [CHAIN GroupReduce (GroupReduce at
> org.apache.mahout.flinkbindings.blas.FlinkOpAtB$.notZippable(FlinkOpAtB.scala:78))
> -> Map (Map at
> org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$.apply(FlinkOpMapBlock.scala:37))
> -> FlatMap (FlatMap at
> org.apache.mahout.flinkbindings.drm.BlockifiedFlinkDrm.asRowWise(FlinkDrm.scala:93))
> (8/10)] ERROR org.apache.flink.runtime.operators.BatchTask - Error in task
> code: CHAIN GroupReduce (GroupReduce at
> org.apache.mahout.flinkbindings.blas.FlinkOpAtB$.notZippable(FlinkOpAtB.scala:78))
> -> Map (Map at
> org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$.apply(FlinkOpMapBlock.scala:37))
> -> FlatMap (FlatMap at
> org.apache.mahout.flinkbindings.drm.BlockifiedFlinkDrm.asRowWise(FlinkDrm.scala:93))
> (8/10)
> java.lang.ArrayIndexOutOfBoundsException: 5
> at
> org.apache.mahout.math.drm.package$$anonfun$4$$anonfun$apply$3.apply(package.scala:317)
> at
> org.apache.mahout.math.drm.package$$anonfun$4$$anonfun$apply$3.apply(package.scala:317)
> at
> org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3$$anonfun$apply$2.apply(MatrixOps.scala:164)
> at
> org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3$$anonfun$apply$2.apply(MatrixOps.scala:164)
> at scala.collection.Iterator$class.foreach(Iterator.scala:727)
> at scala.collection.AbstractIterator.foreach(Iterator.scala:1157)
> at scala.collection.IterableLike$class.foreach(IterableLike.scala:72)
> at scala.collection.AbstractIterable.foreach(Iterable.scala:54)
> at
> org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3.apply(MatrixOps.scala:164)
> at
> org.apache.mahout.math.scalabindings.MatrixOps$$anonfun$$colon$eq$3.apply(MatrixOps.scala:164)
> at scala.collection.Iterator$class.foreach(Iterator.scala:727)
> at scala.collection.AbstractIterator.foreach(Iterator.scala:1157)
> at scala.collection.IterableLike$class.foreach(IterableLike.scala:72)
> at scala.collection.AbstractIterable.foreach(Iterable.scala:54)
> at
> org.apache.mahout.math.scalabindings.MatrixOps.$colon$eq(MatrixOps.scala:164)
> at
> org.apache.mahout.math.drm.package$$anonfun$4.apply(package.scala:317)
> at
> org.apache.mahout.math.drm.package$$anonfun$4.apply(package.scala:311)
> at
> org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$$anonfun$1.apply(FlinkOpMapBlock.scala:39)
> at
> org.apache.mahout.flinkbindings.blas.FlinkOpMapBlock$$anonfun$1.apply(FlinkOpMapBlock.scala:38)
> at org.apache.flink.api.scala.DataSet$$anon$1.map(DataSet.scala:297)
> at
> org.apache.flink.runtime.operators.chaining.ChainedMapDriver.collect(ChainedMapDriver.java:78)
> at
> org.apache.mahout.flinkbindings.blas.FlinkOpAtB$$anon$6.reduce(FlinkOpAtB.scala:86)
> at
> org.apache.flink.runtime.operators.GroupReduceDriver.run(GroupReduceDriver.java:125)
> at org.apache.flink.runtime.operators.BatchTask.run(BatchTask.java:480)
> at
> org.apache.flink.runtime.operators.BatchTask.invoke(BatchTask.java:345)
> at org.apache.flink.runtime.taskmanager.Task.run(Task.java:559)
> at java.lang.Thread.run(Thread.java:745)
> {code}
--
This message was sent by Atlassian JIRA
(v6.3.4#6332)