.. Licensed to the Apache Software Foundation (ASF) under one
   or more contributor license agreements. See the NOTICE file
   distributed with this work for additional information
   regarding copyright ownership. The ASF licenses this file
   to you under the Apache License, Version 2.0 (the
   "License"); you may not use this file except in compliance
   with the License. You may obtain a copy of the License at

.. http://www.apache.org/licenses/LICENSE-2.0

.. Unless required by applicable law or agreed to in writing,
   software distributed under the License is distributed on an
   "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
   KIND, either express or implied. See the License for the
   specific language governing permissions and limitations
   under the License.

MLlib
=====

Classification
--------------

.. currentmodule:: pyspark.mllib.classification

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    LogisticRegressionModel
    LogisticRegressionWithSGD
    LogisticRegressionWithLBFGS
    SVMModel
    SVMWithSGD
    NaiveBayesModel
    NaiveBayes
    StreamingLogisticRegressionWithSGD

Clustering
----------

.. currentmodule:: pyspark.mllib.clustering

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    BisectingKMeansModel
    BisectingKMeans
    KMeansModel
    KMeans
    GaussianMixtureModel
    GaussianMixture
    PowerIterationClusteringModel
    PowerIterationClustering
    StreamingKMeans
    StreamingKMeansModel
    LDA
    LDAModel

Evaluation
----------

.. currentmodule:: pyspark.mllib.evaluation

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    BinaryClassificationMetrics
    RegressionMetrics
    MulticlassMetrics
    RankingMetrics

Feature
-------

.. currentmodule:: pyspark.mllib.feature

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    Normalizer
    StandardScalerModel
    StandardScaler
    HashingTF
    IDFModel
    IDF
    Word2Vec
    Word2VecModel
    ChiSqSelector
    ChiSqSelectorModel
    ElementwiseProduct

Frequency Pattern Mining
------------------------

.. currentmodule:: pyspark.mllib.fpm

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    FPGrowth
    FPGrowthModel
    PrefixSpan
    PrefixSpanModel

Vector and Matrix
-----------------

.. currentmodule:: pyspark.mllib.linalg

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    Vector
    DenseVector
    SparseVector
    Vectors
    Matrix
    DenseMatrix
    SparseMatrix
    Matrices
    QRDecomposition

Distributed Representation
~~~~~~~~~~~~~~~~~~~~~~~~~~

.. currentmodule:: pyspark.mllib.linalg.distributed

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    BlockMatrix
    CoordinateMatrix
    DistributedMatrix
    IndexedRow
    IndexedRowMatrix
    MatrixEntry
    RowMatrix
    SingularValueDecomposition

Random
------

.. currentmodule:: pyspark.mllib.random

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    RandomRDDs

Recommendation
--------------

.. currentmodule:: pyspark.mllib.recommendation

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    MatrixFactorizationModel
    ALS
    Rating

Regression
----------

.. currentmodule:: pyspark.mllib.regression

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    LabeledPoint
    LinearModel
    LinearRegressionModel
    LinearRegressionWithSGD
    RidgeRegressionModel
    RidgeRegressionWithSGD
    LassoModel
    LassoWithSGD
    IsotonicRegressionModel
    IsotonicRegression
    StreamingLinearAlgorithm
    StreamingLinearRegressionWithSGD

Statistics
----------

.. currentmodule:: pyspark.mllib.stat

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    Statistics
    MultivariateStatisticalSummary
    ChiSqTestResult
    MultivariateGaussian
    KernelDensity
    KolmogorovSmirnovTestResult

Tree
----

.. currentmodule:: pyspark.mllib.tree

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    DecisionTreeModel
    DecisionTree
    RandomForestModel
    RandomForest
    GradientBoostedTreesModel
    GradientBoostedTrees

Utilities
---------

.. currentmodule:: pyspark.mllib.util

.. autosummary::
    :template: autosummary/class_with_docs.rst
    :toctree: api/

    JavaLoader
    JavaSaveable
    LinearDataGenerator
    Loader
    MLUtils
    Saveable