diff --git a/mllib-dal/src/main/scala/com/intel/oap/mllib/OneDAL.scala b/mllib-dal/src/main/scala/com/intel/oap/mllib/OneDAL.scala index 6fa6f400e..5c781cf4e 100644 --- a/mllib-dal/src/main/scala/com/intel/oap/mllib/OneDAL.scala +++ b/mllib-dal/src/main/scala/com/intel/oap/mllib/OneDAL.scala @@ -395,6 +395,10 @@ object OneDAL { mergedTables } + /** + * Returns a new RDD containing two Tuple3 values: (featuresArrayAddress, featuresNumRows, featuresNumCols) + * and (labelsArrayAddress, labelsNumRows, labelsNumCols). + */ def coalesceLabelPointsToHomogenTables(labeledPoints: Dataset[_], labelCol: String, featuresCol: String, @@ -578,6 +582,9 @@ object OneDAL { matrix } + /** + * Returns a new RDD of Tuple3 values, each holding (targetArrayAddress, numRows, numCols). + */ def coalesceVectorsToHomogenTables(data: RDD[Vector], executorNum: Int, device: Common.ComputeDevice): RDD[Tuple3[Long, Long, Long]] = { logger.info(s"Processing partitions with $executorNum executors")