dusenberrymw · MechCoder · Jul 23, 2015
diff --git a/docs/mllib-data-types.md b/docs/mllib-data-types.md
@@ -379,14 +379,14 @@ A [`RowMatrix`](api/python/pyspark.mllib.html#pyspark.mllib.linalg.RowMatrix) ca
 an `RDD` of Vectors.
 
 {% highlight python %}
-from pyspark.mllib.linalg import DistributedMatrices, Vectors
+from pyspark.mllib.linalg import RowMatrix, Vectors
 
 # Create an RDD of Vectors.
 rows = sc.parallelize([Vectors.dense([1, 2, 3]), Vectors.dense([4, 5, 6]), 
                        Vectors.dense([7, 8, 9]), Vectors.dense([10, 11, 12])])
 
 # Create a RowMatrix from an RDD[Vector].
-mat = DistributedMatrices.rowMatrix(rows)
+mat = RowMatrix(rows)
 
 # Get its size.
 m = mat.numRows()  # 4
@@ -468,7 +468,7 @@ created from an `RDD` of IndexedRows, where
 indices.
 
 {% highlight python %}
-from pyspark.mllib.linalg import Vectors, DistributedMatrices, IndexedRow, IndexedRowMatrix
+from pyspark.mllib.linalg import Vectors, IndexedRow, IndexedRowMatrix
 
 # Create an RDD of indexed rows.
 #   - This can be done explicitly with the IndexedRow class:
@@ -481,7 +481,7 @@ indexedRows = sc.parallelize([(0, Vectors.dense([1, 2, 3])), (1, Vectors.dense([
                               (2, Vectors.dense([7, 8, 9])), (3, Vectors.dense([10, 11, 12]))])
 
 # Create an IndexedRowMatrix from an RDD[IndexedRow].
-mat = DistributedMatrices.indexedRowMatrix(indexedRows)
+mat = IndexedRowMatrix(indexedRows)
 
 # Get its size.
 m = mat.numRows()  # 4
@@ -572,7 +572,7 @@ created from a `RDD` of MatrixEntry entries, where
 `toRowMatrix`, or to an `IndexedRowMatrix` with sparse rows by calling `toIndexedRowMatrix`.
 
 {% highlight python %}
-from pyspark.mllib.linalg import DistributedMatrices, MatrixEntry, CoordinateMatrix
+from pyspark.mllib.linalg import MatrixEntry, CoordinateMatrix
 
 # Create an RDD of coordinate entries.
 #   - This can be done explicitly with the MatrixEntry class:
@@ -581,7 +581,7 @@ entries = sc.parallelize([MatrixEntry(0, 0, 1.2), MatrixEntry(1, 0, 2.1), Matrix
 entries = sc.parallelize([(0, 0, 1.2), (1, 0, 2.1), (2, 1, 3.7)])
 
 # Create a CoordinateMatrix from an RDD[MatrixEntry].
-mat = DistributedMatrices.coordinateMatrix(entries)
+mat = CoordinateMatrix(entries)
 
 # Get its size.
 m = mat.numRows()  # 3

diff --git a/mllib/src/main/scala/org/apache/spark/mllib/api/python/PythonMLLibAPI.scala b/mllib/src/main/scala/org/apache/spark/mllib/api/python/PythonMLLibAPI.scala
@@ -21,7 +21,7 @@ import java.io.OutputStream
 import java.nio.{ByteBuffer, ByteOrder}
 import java.util.{ArrayList => JArrayList, List => JList, Map => JMap}
 
-import org.apache.spark.mllib.linalg.distributed.{DistributedMatrices, RowMatrix, IndexedRowMatrix, IndexedRow,
+import org.apache.spark.mllib.linalg.distributed.{RowMatrix, IndexedRowMatrix, IndexedRow,
   MatrixEntry, CoordinateMatrix}
 
 import scala.collection.JavaConverters._
@@ -1109,22 +1109,22 @@ private[python] class PythonMLLibAPI extends Serializable {
   }
 
   /**
-   * Wrapper around DistributedMatrices.rowMatrix factory method.
+   * Wrapper around the RowMatrix constructor.
    */
   def createRowMatrix(rows: JavaRDD[Vector], numRows: Long, numCols: Int): RowMatrix = {
-    DistributedMatrices.rowMatrix(rows.rdd, numRows, numCols)
+    new RowMatrix(rows.rdd, numRows, numCols)
   }
 
   /**
-   * Wrapper around DistributedMatrices.indexedRowMatrix factory method.
+   * Wrapper around the IndexedRowMatrix constructor.
    */
   def createIndexedRowMatrix(rows: DataFrame, numRows: Long, numCols: Int): IndexedRowMatrix = {
     // We use DataFrames for serialization of IndexedRows from Python, so map each Row in the
     // DataFrame back to an IndexedRow.
     val indexedRows = rows.map {
       case Row(index: Long, vector: Vector) => IndexedRow(index, vector)
     }
-    DistributedMatrices.indexedRowMatrix(indexedRows, numRows, numCols)
+    new IndexedRowMatrix(indexedRows, numRows, numCols)
   }
 
   /**
@@ -1137,15 +1137,15 @@ private[python] class PythonMLLibAPI extends Serializable {
   }
 
   /**
-   * Wrapper around DistributedMatrices.coordinateMatrix factory method.
+   * Wrapper around the CoordinateMatrix constructor.
    */
   def createCoordinateMatrix(rows: DataFrame, numRows: Long, numCols: Long): CoordinateMatrix = {
     // We use DataFrames for serialization of MatrixEntry entries from Python, so map each Row in
     // the DataFrame back to a MatrixEntry.
     val entries = rows.map {
       case Row(i: Long, j: Long, value: Double) => MatrixEntry(i, j, value)
     }
-    DistributedMatrices.coordinateMatrix(entries, numRows, numCols)
+    new CoordinateMatrix(entries, numRows, numCols)
   }
 
   /**

diff --git a/mllib/src/main/scala/org/apache/spark/mllib/linalg/distributed/DistributedMatrix.scala b/mllib/src/main/scala/org/apache/spark/mllib/linalg/distributed/DistributedMatrix.scala