
Commit 51d25d7

Scowley4 authored and jnothman committed
Fix spacing and formatting inconsistencies (scikit-learn#13747)
1 parent 18b4f55 commit 51d25d7

27 files changed: +86 −86 lines

sklearn/cluster/hierarchical.py

Lines changed: 4 additions & 4 deletions
@@ -148,7 +148,7 @@ def ward_tree(X, connectivity=None, n_clusters=None, return_distance=False):
     Parameters
     ----------
     X : array, shape (n_samples, n_features)
-        feature matrix  representing n_samples samples to be clustered
+        feature matrix representing n_samples samples to be clustered
 
     connectivity : sparse matrix (optional).
         connectivity matrix. Defines for each sample the neighboring samples
@@ -219,7 +219,7 @@ def ward_tree(X, connectivity=None, n_clusters=None, return_distance=False):
     n_samples, n_features = X.shape
 
     if connectivity is None:
-        from scipy.cluster import hierarchy # imports PIL
+        from scipy.cluster import hierarchy  # imports PIL
 
         if n_clusters is not None:
             warnings.warn('Partial build of the tree is implemented '
@@ -433,7 +433,7 @@ def linkage_tree(X, connectivity=None, n_clusters=None, linkage='complete',
                          'of %s, but %s was given' % (linkage_choices.keys(), linkage))
 
     if connectivity is None:
-        from scipy.cluster import hierarchy # imports PIL
+        from scipy.cluster import hierarchy  # imports PIL
 
         if n_clusters is not None:
             warnings.warn('Partial build of the tree is implemented '
@@ -597,7 +597,7 @@ def _single_linkage(*args, **kwargs):
 
 
 ###############################################################################
-# Functions for cutting  hierarchical clustering tree
+# Functions for cutting hierarchical clustering tree
 
 def _hc_cut(n_clusters, children, n_leaves):
     """Function cutting the ward tree for a given number of clusters.

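Aside: the `connectivity` argument touched in the ward_tree hunks above is easiest to try through the public AgglomerativeClustering wrapper. A minimal sketch — the data, neighbour count and cluster count are illustrative choices, not part of the commit:

    import numpy as np
    from sklearn.cluster import AgglomerativeClustering
    from sklearn.neighbors import kneighbors_graph

    X = np.random.RandomState(0).rand(20, 2)
    # Sparse connectivity matrix: merges are restricted to each sample's
    # nearest neighbours, as the ward_tree docstring describes.
    connectivity = kneighbors_graph(X, n_neighbors=3, include_self=False)
    ward = AgglomerativeClustering(n_clusters=3, linkage='ward',
                                   connectivity=connectivity).fit(X)
    print(ward.labels_)
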
sklearn/cluster/k_means_.py

Lines changed: 6 additions & 6 deletions
@@ -706,7 +706,7 @@ def _init_centroids(X, k, init, random_state=None, x_squared_norms=None,
         an int to make the randomness deterministic.
         See :term:`Glossary <random_state>`.
 
-        x_squared_norms : array, shape (n_samples,), optional
+    x_squared_norms : array, shape (n_samples,), optional
         Squared euclidean norm of each data point. Pass it if you have it at
         hands already to avoid it being recomputed here. Default: None
 
@@ -1419,8 +1419,8 @@ class MiniBatchKMeans(KMeans):
     ...               [3, 2], [5, 5], [1, -1]])
     >>> # manually fit on batches
     >>> kmeans = MiniBatchKMeans(n_clusters=2,
-    ...         random_state=0,
-    ...         batch_size=6)
+    ...                          random_state=0,
+    ...                          batch_size=6)
     >>> kmeans = kmeans.partial_fit(X[0:6,:])
     >>> kmeans = kmeans.partial_fit(X[6:12,:])
     >>> kmeans.cluster_centers_
@@ -1430,9 +1430,9 @@ class MiniBatchKMeans(KMeans):
     array([0, 1], dtype=int32)
     >>> # fit on the whole data
     >>> kmeans = MiniBatchKMeans(n_clusters=2,
-    ...         random_state=0,
-    ...         batch_size=6,
-    ...         max_iter=10).fit(X)
+    ...                          random_state=0,
+    ...                          batch_size=6,
+    ...                          max_iter=10).fit(X)
     >>> kmeans.cluster_centers_
     array([[3.95918367, 2.40816327],
            [1.12195122, 1.3902439 ]])

sklearn/covariance/empirical_covariance_.py

Lines changed: 2 additions & 2 deletions
@@ -122,8 +122,8 @@ class EmpiricalCovariance(BaseEstimator):
     ...                      [.3, .4]])
     >>> rng = np.random.RandomState(0)
     >>> X = rng.multivariate_normal(mean=[0, 0],
-    ...         cov=real_cov,
-    ...         size=500)
+    ...                             cov=real_cov,
+    ...                             size=500)
     >>> cov = EmpiricalCovariance().fit(X)
     >>> cov.covariance_ # doctest: +ELLIPSIS
     array([[0.7569..., 0.2818...],

sklearn/covariance/graph_lasso_.py

Lines changed: 8 additions & 8 deletions
@@ -337,10 +337,10 @@ class GraphicalLasso(EmpiricalCovariance):
     --------
     >>> import numpy as np
     >>> from sklearn.covariance import GraphicalLasso
-    >>> true_cov = np.array([[.8, 0., .2, 0.],
-    ...                      [0., .4, 0., 0.],
-    ...                      [.2, 0., .3, .1],
-    ...                      [0., 0., .1, .7]])
+    >>> true_cov = np.array([[0.8, 0.0, 0.2, 0.0],
+    ...                      [0.0, 0.4, 0.0, 0.0],
+    ...                      [0.2, 0.0, 0.3, 0.1],
+    ...                      [0.0, 0.0, 0.1, 0.7]])
     >>> np.random.seed(0)
     >>> X = np.random.multivariate_normal(mean=[0, 0, 0, 0],
     ...                                   cov=true_cov,
@@ -592,10 +592,10 @@ class GraphicalLassoCV(GraphicalLasso):
     --------
     >>> import numpy as np
     >>> from sklearn.covariance import GraphicalLassoCV
-    >>> true_cov = np.array([[.8, 0., .2, 0.],
-    ...                      [0., .4, 0., 0.],
-    ...                      [.2, 0., .3, .1],
-    ...                      [0., 0., .1, .7]])
+    >>> true_cov = np.array([[0.8, 0.0, 0.2, 0.0],
+    ...                      [0.0, 0.4, 0.0, 0.0],
+    ...                      [0.2, 0.0, 0.3, 0.1],
+    ...                      [0.0, 0.0, 0.1, 0.7]])
     >>> np.random.seed(0)
     >>> X = np.random.multivariate_normal(mean=[0, 0, 0, 0],
     ...                                   cov=true_cov,

sklearn/datasets/base.py

Lines changed: 18 additions & 18 deletions
@@ -568,12 +568,12 @@ def load_digits(n_class=10, return_X_y=False):
 def load_diabetes(return_X_y=False):
     """Load and return the diabetes dataset (regression).
 
-      ==============   ==================
-      Samples total    442
-      Dimensionality   10
-      Features         real, -.2 < x < .2
-      Targets          integer 25 - 346
-      ==============   ==================
+    ==============   ==================
+    Samples total    442
+    Dimensionality   10
+    Features         real, -.2 < x < .2
+    Targets          integer 25 - 346
+    ==============   ==================
 
     Read more in the :ref:`User Guide <diabetes_dataset>`.
 
@@ -621,12 +621,12 @@ def load_diabetes(return_X_y=False):
 def load_linnerud(return_X_y=False):
     """Load and return the linnerud dataset (multivariate regression).
 
-      ==============   ============================
-      Samples total    20
-      Dimensionality   3 (for both data and target)
-      Features         integer
-      Targets          integer
-      ==============   ============================
+    ==============   ============================
+    Samples total    20
+    Dimensionality   3 (for both data and target)
+    Features         integer
+    Targets          integer
+    ==============   ============================
 
     Read more in the :ref:`User Guide <linnerrud_dataset>`.
 
@@ -685,12 +685,12 @@ def load_linnerud(return_X_y=False):
 def load_boston(return_X_y=False):
     """Load and return the boston house-prices dataset (regression).
 
-      ==============   ==============
-      Samples total    506
-      Dimensionality   13
-      Features         real, positive
-      Targets          real 5. - 50.
-      ==============   ==============
+    ==============   ==============
+    Samples total    506
+    Dimensionality   13
+    Features         real, positive
+    Targets          real 5. - 50.
+    ==============   ==============
 
     Read more in the :ref:`User Guide <boston_dataset>`.

sklearn/datasets/california_housing.py

Lines changed: 6 additions & 6 deletions
@@ -50,12 +50,12 @@ def fetch_california_housing(data_home=None, download_if_missing=True,
                              return_X_y=False):
     """Load the California housing dataset (regression).
 
-      ==============   ==============
-      Samples total    20640
-      Dimensionality   8
-      Features         real
-      Target           real 0.15 - 5.
-      ==============   ==============
+    ==============   ==============
+    Samples total    20640
+    Dimensionality   8
+    Features         real
+    Target           real 0.15 - 5.
+    ==============   ==============
 
     Read more in the :ref:`User Guide <california_housing_dataset>`.

sklearn/datasets/svmlight_format.py

Lines changed: 1 addition & 1 deletion
@@ -435,7 +435,7 @@ def dump_svmlight_file(X, y, f, zero_based=True, comment=None, query_id=None,
         # if a user wants to get fancy, they'll have to decode themselves.
         # Avoid mention of str and unicode types for Python 3.x compat.
         if isinstance(comment, bytes):
-            comment.decode("ascii") # just for the exception
+            comment.decode("ascii")  # just for the exception
         else:
             comment = comment.encode("utf-8")
         if b"\0" in comment:

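Aside: the decode-for-the-exception idiom in this hunk is worth seeing on its own. A hypothetical standalone version — the function name and error message are mine; only the middle four lines come from the source:

    def validate_comment(comment):
        # The decode result is thrown away; we call it only so that a
        # non-ASCII bytes comment raises UnicodeDecodeError early.
        if isinstance(comment, bytes):
            comment.decode("ascii")  # just for the exception
        else:
            comment = comment.encode("utf-8")
        if b"\0" in comment:
            raise ValueError("comment string contains NUL byte")
        return comment

    print(validate_comment("ok"))  # b'ok'
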
sklearn/decomposition/base.py

Lines changed: 1 addition & 1 deletion
@@ -27,7 +27,7 @@ def get_covariance(self):
         """Compute data covariance with the generative model.
 
         ``cov = components_.T * S**2 * components_ + sigma2 * eye(n_features)``
-        where S**2 contains the explained variances, and sigma2  contains the
+        where S**2 contains the explained variances, and sigma2 contains the
         noise variances.
 
         Returns

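Aside: the generative covariance formula quoted in this hunk is what `PCA.get_covariance` evaluates. A minimal sketch comparing it with the sample covariance, on synthetic data of my own choosing:

    import numpy as np
    from sklearn.decomposition import PCA

    rng = np.random.RandomState(0)
    X = rng.multivariate_normal(mean=np.zeros(4),
                                cov=np.diag([4., 3., 2., 1.]), size=2000)
    pca = PCA(n_components=2).fit(X)
    # get_covariance() applies the docstring's formula: it matches the
    # sample covariance in the kept components and folds the discarded
    # directions into the isotropic noise term.
    print(np.round(pca.get_covariance(), 1))
    print(np.round(np.cov(X, rowvar=False), 1))
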
sklearn/decomposition/dict_learning.py

Lines changed: 1 addition & 1 deletion
@@ -171,7 +171,7 @@ def _sparse_encode(X, dictionary, gram, cov=None, algorithm='lasso_lars',
                              copy_Xy=copy_cov).T
     else:
         raise ValueError('Sparse coding method must be "lasso_lars" '
-                        '"lasso_cd", "lasso", "threshold" or "omp", got %s.'
+                         '"lasso_cd", "lasso", "threshold" or "omp", got %s.'
                          % algorithm)
     if new_code.ndim != 2:
         return new_code.reshape(n_samples, n_components)

sklearn/decomposition/kernel_pca.py

Lines changed: 2 additions & 2 deletions
@@ -230,9 +230,9 @@ def _fit_transform(self, K):
         # there is a link between
         # the eigenvectors of K=Phi(X)'Phi(X) and the ones of Phi(X)Phi(X)'
         # if v is an eigenvector of K
-        #     then Phi(X)v is an eigenvector of Phi(X)Phi(X)'
+        # then Phi(X)v is an eigenvector of Phi(X)Phi(X)'
         # if u is an eigenvector of Phi(X)Phi(X)'
-        #     then Phi(X)'u is an eigenvector of Phi(X)Phi(X)'
+        # then Phi(X)'u is an eigenvector of Phi(X)Phi(X)'
         #
         # At this stage our self.alphas_ (the v) have norm 1, we need to scale
         # them so that eigenvectors in kernel feature space (the u) have norm=1

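Aside: the eigenvector duality stated in these comments is easy to verify numerically. A sketch in the comment's own notation, with a random stand-in for Phi(X):

    import numpy as np

    rng = np.random.RandomState(0)
    Phi = rng.rand(6, 4)          # stand-in for the mapped data Phi(X)
    K = Phi.T @ Phi               # K = Phi(X)'Phi(X), as in the comment
    eigvals, eigvecs = np.linalg.eigh(K)
    v = eigvecs[:, -1]            # v is an eigenvector of K
    u = Phi @ v                   # then Phi(X)v ...
    # ... is an eigenvector of Phi(X)Phi(X)' with the same eigenvalue:
    print(np.allclose((Phi @ Phi.T) @ u, eigvals[-1] * u))   # True
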
sklearn/discriminant_analysis.py

Lines changed: 1 addition & 1 deletion
@@ -716,7 +716,7 @@ def _decision_function(self, X):
             Xm = X - self.means_[i]
             X2 = np.dot(Xm, R * (S ** (-0.5)))
             norm2.append(np.sum(X2 ** 2, 1))
-        norm2 = np.array(norm2).T # shape = [len(X), n_classes]
+        norm2 = np.array(norm2).T  # shape = [len(X), n_classes]
         u = np.asarray([np.sum(np.log(s)) for s in self.scalings_])
         return (-0.5 * (norm2 + u) + np.log(self.priors_))

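Aside: the shape comment fixed in this hunk describes a stacking pattern — one per-class 1-D array appended per iteration, then transposed so rows index samples and columns index classes. A toy illustration with made-up numbers:

    import numpy as np

    n_samples, n_classes = 4, 3
    per_class = [np.full(n_samples, k, dtype=float) for k in range(n_classes)]
    norm2 = np.array(per_class).T  # shape = (n_samples, n_classes)
    print(norm2.shape)             # (4, 3)
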
sklearn/dummy.py

Lines changed: 2 additions & 2 deletions
@@ -492,10 +492,10 @@ def predict(self, X, return_std=False):
 
         Returns
         -------
-            y : array, shape = [n_samples] or [n_samples, n_outputs]
+        y : array, shape = [n_samples] or [n_samples, n_outputs]
             Predicted target values for X.
 
-            y_std : array, shape = [n_samples] or [n_samples, n_outputs]
+        y_std : array, shape = [n_samples] or [n_samples, n_outputs]
             Standard deviation of predictive distribution of query points.
         """
         check_is_fitted(self, "constant_")

sklearn/ensemble/_gb_losses.py

Lines changed: 1 addition & 1 deletion
@@ -879,6 +879,6 @@ def get_init_raw_predictions(self, X, estimator):
     'lad': LeastAbsoluteError,
     'huber': HuberLossFunction,
     'quantile': QuantileLossFunction,
-    'deviance': None, # for both, multinomial and binomial
+    'deviance': None,  # for both, multinomial and binomial
     'exponential': ExponentialLoss,
 }

sklearn/ensemble/gradient_boosting.py

Lines changed: 3 additions & 3 deletions
@@ -1694,7 +1694,7 @@ def _staged_raw_predict(self, X):
         Regression and binary classification are special cases with
         ``k == 1``, otherwise ``k==n_classes``.
         """
-        X = check_array(X, dtype=DTYPE, order="C",  accept_sparse='csr')
+        X = check_array(X, dtype=DTYPE, order="C", accept_sparse='csr')
         raw_predictions = self._raw_predict_init(X)
         for i in range(self.estimators_.shape[0]):
             predict_stage(self.estimators_, i, X, self.learning_rate,
@@ -2085,7 +2085,7 @@ def decision_function(self, X):
         `classes_`. Regression and binary classification produce an
         array of shape [n_samples].
         """
-        X = check_array(X, dtype=DTYPE, order="C",  accept_sparse='csr')
+        X = check_array(X, dtype=DTYPE, order="C", accept_sparse='csr')
         raw_predictions = self._raw_predict(X)
         if raw_predictions.shape[1] == 1:
             return raw_predictions.ravel()
@@ -2527,7 +2527,7 @@ def predict(self, X):
         y : array, shape (n_samples,)
             The predicted values.
         """
-        X = check_array(X, dtype=DTYPE, order="C",  accept_sparse='csr')
+        X = check_array(X, dtype=DTYPE, order="C", accept_sparse='csr')
         # In regression we can directly return the raw value from the trees.
         return self._raw_predict(X).ravel()

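Aside: all three hunks touch the same `check_array` call. A minimal sketch of what that call enforces — the inputs here are illustrative:

    import numpy as np
    from scipy import sparse
    from sklearn.utils import check_array

    # Coerce input to a C-ordered array of the requested dtype, letting
    # CSR matrices pass through unchanged.
    X_dense = check_array([[1, 2], [3, 4]], dtype=np.float32, order="C")
    X_sparse = check_array(sparse.csr_matrix([[0., 1.], [2., 0.]]),
                           accept_sparse='csr')
    print(X_dense.dtype, X_dense.flags['C_CONTIGUOUS'], X_sparse.format)
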
sklearn/ensemble/weight_boosting.py

Lines changed: 2 additions & 2 deletions
@@ -685,7 +685,7 @@ class in ``classes_``, respectively.
             # The weights are all 1. for SAMME.R
             pred = sum(_samme_proba(estimator, n_classes, X)
                        for estimator in self.estimators_)
-        else: # self.algorithm == "SAMME"
+        else:  # self.algorithm == "SAMME"
             pred = sum((estimator.predict(X) == classes).T * w
                        for estimator, w in zip(self.estimators_,
                                                self.estimator_weights_))
@@ -780,7 +780,7 @@ def predict_proba(self, X):
             # The weights are all 1. for SAMME.R
             proba = sum(_samme_proba(estimator, n_classes, X)
                         for estimator in self.estimators_)
-        else: # self.algorithm == "SAMME"
+        else:  # self.algorithm == "SAMME"
             proba = sum(estimator.predict_proba(X) * w
                         for estimator, w in zip(self.estimators_,
                                                 self.estimator_weights_))

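Aside: the SAMME branch after the comment fixed in the first hunk accumulates weighted one-hot votes. A toy version with made-up estimator outputs and weights:

    import numpy as np

    # Each estimator's class predictions are compared against `classes`
    # (a column vector, as in the AdaBoost source), transposed to
    # (n_samples, n_classes), weighted and summed.
    classes = np.array([0, 1, 2])[:, np.newaxis]
    est_preds = [np.array([0, 1, 1, 2]), np.array([0, 2, 1, 2])]
    weights = [0.7, 0.3]
    pred = sum((p == classes).T * w for p, w in zip(est_preds, weights))
    print(pred)                 # shape (4 samples, 3 classes)
    print(pred.argmax(axis=1))  # [0 1 1 2]
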
sklearn/exceptions.py

Lines changed: 2 additions & 2 deletions
@@ -29,7 +29,7 @@ class NotFittedError(ValueError, AttributeError):
     ...     LinearSVC().predict([[1, 2], [2, 3], [3, 4]])
     ... except NotFittedError as e:
     ...     print(repr(e))
-    ...                    # doctest: +NORMALIZE_WHITESPACE +ELLIPSIS
+    ...     # doctest: +NORMALIZE_WHITESPACE +ELLIPSIS
     NotFittedError('This LinearSVC instance is not fitted yet'...)
 
     .. versionchanged:: 0.18
@@ -114,7 +114,7 @@ class FitFailedWarning(RuntimeWarning):
     >>> X, y = [[1, 2], [3, 4], [5, 6], [7, 8]], [0, 0, 1, 1]
     >>> with warnings.catch_warnings(record=True) as w:
     ...     try:
-    ...         gs.fit(X, y) # This will raise a ValueError since C is < 0
+    ...         gs.fit(X, y)  # This will raise a ValueError since C is < 0
     ...     except ValueError:
     ...         pass
     ...     print(repr(w[-1].message))

sklearn/feature_extraction/text.py

Lines changed: 2 additions & 2 deletions
@@ -110,7 +110,7 @@ def _check_stop_list(stop):
         raise ValueError("not a built-in stop list: %s" % stop)
     elif stop is None:
         return None
-    else: # assume it's a collection
+    else:  # assume it's a collection
         return frozenset(stop)
 
 
@@ -1496,7 +1496,7 @@ class TfidfVectorizer(CountVectorizer):
 
     idf_ : array, shape (n_features)
         The inverse document frequency (IDF) vector; only defined
-         if ``use_idf`` is True.
+        if ``use_idf`` is True.
 
     stop_words_ : set
         Terms that were ignored because they either:

sklearn/kernel_ridge.py

Lines changed: 1 addition & 1 deletion
@@ -27,7 +27,7 @@ class KernelRidge(BaseEstimator, RegressorMixin, MultiOutputMixin):
     squared error loss while support vector regression uses epsilon-insensitive
     loss, both combined with l2 regularization. In contrast to SVR, fitting a
     KRR model can be done in closed-form and is typically faster for
-    medium-sized datasets.  On the other hand, the learned model is non-sparse
+    medium-sized datasets. On the other hand, the learned model is non-sparse
     and thus slower than SVR, which learns a sparse model for epsilon > 0, at
     prediction-time.

sklearn/metrics/pairwise.py

Lines changed: 11 additions & 11 deletions
@@ -1169,17 +1169,17 @@ def distance_metrics():
 
     The valid distance metrics, and the function they map to, are:
 
-      ============     ====================================
-      metric           Function
-      ============     ====================================
-      'cityblock'      metrics.pairwise.manhattan_distances
-      'cosine'         metrics.pairwise.cosine_distances
-      'euclidean'      metrics.pairwise.euclidean_distances
-      'haversine'      metrics.pairwise.haversine_distances
-      'l1'             metrics.pairwise.manhattan_distances
-      'l2'             metrics.pairwise.euclidean_distances
-      'manhattan'      metrics.pairwise.manhattan_distances
-      ============     ====================================
+    ============     ====================================
+    metric           Function
+    ============     ====================================
+    'cityblock'      metrics.pairwise.manhattan_distances
+    'cosine'         metrics.pairwise.cosine_distances
+    'euclidean'      metrics.pairwise.euclidean_distances
+    'haversine'      metrics.pairwise.haversine_distances
+    'l1'             metrics.pairwise.manhattan_distances
+    'l2'             metrics.pairwise.euclidean_distances
+    'manhattan'      metrics.pairwise.manhattan_distances
+    ============     ====================================
 
     Read more in the :ref:`User Guide <metrics>`.

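Aside: the table in this hunk can be exercised directly — 'cityblock', 'l1' and 'manhattan' all resolve to manhattan_distances. A quick check on a small array of my own:

    import numpy as np
    from sklearn.metrics import pairwise_distances
    from sklearn.metrics.pairwise import manhattan_distances

    X = np.array([[0., 1.], [2., 3.], [4., 0.]])
    # The string alias and the function from the table agree:
    print(np.allclose(pairwise_distances(X, metric='cityblock'),
                      manhattan_distances(X)))   # True
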
sklearn/model_selection/_validation.py

Lines changed: 1 addition & 1 deletion
@@ -1118,7 +1118,7 @@ def learning_curve(estimator, X, y, groups=None,
                    train_sizes=np.linspace(0.1, 1.0, 5), cv='warn',
                    scoring=None, exploit_incremental_learning=False,
                    n_jobs=None, pre_dispatch="all", verbose=0, shuffle=False,
-                    random_state=None, error_score='raise-deprecating'):
+                   random_state=None, error_score='raise-deprecating'):
     """Learning curve.
 
     Determines cross-validated training and test scores for different training

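Aside: the signature realigned in this hunk is easiest to read next to a call. A minimal sketch on the iris data, passing `cv` and `train_sizes` explicitly — the dataset and estimator are illustrative choices:

    import numpy as np
    from sklearn.datasets import load_iris
    from sklearn.model_selection import learning_curve
    from sklearn.tree import DecisionTreeClassifier

    X, y = load_iris(return_X_y=True)
    # Cross-validated train/test scores at five training-set sizes.
    sizes, train_scores, test_scores = learning_curve(
        DecisionTreeClassifier(random_state=0), X, y,
        train_sizes=np.linspace(0.1, 1.0, 5), cv=5)
    print(sizes)
    print(test_scores.mean(axis=1).round(2))
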
sklearn/neighbors/lof.py

Lines changed: 1 addition & 1 deletion
@@ -500,5 +500,5 @@ def _local_reachability_density(self, distances_X, neighbors_indices):
                                       self.n_neighbors_ - 1]
         reach_dist_array = np.maximum(distances_X, dist_k)
 
-        #  1e-10 to avoid `nan' when nb of duplicates > n_neighbors_:
+        # 1e-10 to avoid `nan' when nb of duplicates > n_neighbors_:
         return 1. / (np.mean(reach_dist_array, axis=1) + 1e-10)

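Aside: the comment fixed in this hunk guards a division. A toy illustration of the duplicate-points case it mentions:

    import numpy as np

    # With more duplicates than neighbours, every reachability distance
    # can be zero; the 1e-10 term keeps the local reachability density
    # finite instead of dividing by zero.
    reach_dist_array = np.zeros((3, 5))   # pathological all-duplicates case
    lrd = 1. / (np.mean(reach_dist_array, axis=1) + 1e-10)
    print(lrd)                            # large (1e+10 each) but finite
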
sklearn/neural_network/_stochastic_optimizers.py

Lines changed: 1 addition & 1 deletion
@@ -1,7 +1,7 @@
 """Stochastic optimization methods for MLP
 """
 
-# Authors: Jiyuan Qian  <jq401@nyu.edu>
+# Authors: Jiyuan Qian <jq401@nyu.edu>
 # License: BSD 3 clause
 
 import numpy as np
