scikit-learn
diff --git a/asv_benchmarks/benchmarks/datasets.py b/asv_benchmarks/benchmarks/datasets.py
Lines changed: 6 additions & 7 deletions
diff --git a/benchmarks/bench_feature_expansions.py b/benchmarks/bench_feature_expansions.py
Lines changed: 2 additions & 2 deletions
diff --git a/benchmarks/bench_plot_randomized_svd.py b/benchmarks/bench_plot_randomized_svd.py
Lines changed: 1 addition & 1 deletion
diff --git a/benchmarks/bench_random_projections.py b/benchmarks/bench_random_projections.py
Lines changed: 1 addition & 1 deletion
diff --git a/doc/modules/impute.rst b/doc/modules/impute.rst
Lines changed: 2 additions & 2 deletions
diff --git a/doc/modules/multiclass.rst b/doc/modules/multiclass.rst
Lines changed: 4 additions & 4 deletions
diff --git a/examples/applications/plot_tomography_l1_reconstruction.py b/examples/applications/plot_tomography_l1_reconstruction.py
Lines changed: 3 additions & 1 deletion
diff --git a/examples/applications/wikipedia_principal_eigenvector.py b/examples/applications/wikipedia_principal_eigenvector.py
Lines changed: 1 addition & 1 deletion
diff --git a/examples/linear_model/plot_lasso_dense_vs_sparse_data.py b/examples/linear_model/plot_lasso_dense_vs_sparse_data.py
Lines changed: 2 additions & 2 deletions
diff --git a/examples/neighbors/approximate_nearest_neighbors.py b/examples/neighbors/approximate_nearest_neighbors.py
Lines changed: 2 additions & 2 deletions
@@ -1,7 +1,6 @@
 from pathlib import Path
 
 import numpy as np
-import scipy.sparse as sp
 from joblib import Memory
 
 from sklearn.datasets import (
@@ -17,6 +16,7 @@
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sklearn.model_selection import train_test_split
 from sklearn.preprocessing import MaxAbsScaler, StandardScaler
+from sklearn.utils._sparse import _sparse_random
 
 # memory location for caching datasets
 M = Memory(location=str(Path(__file__).resolve().parent / "cache"))
@@ -100,12 +100,12 @@ def _synth_regression_dataset(n_samples=100000, n_features=100, dtype=np.float32
 def _synth_regression_sparse_dataset(
     n_samples=10000, n_features=10000, density=0.01, dtype=np.float32
 ):
-    X = sp.random(
-        m=n_samples, n=n_features, density=density, format="csr", random_state=0
+    X = _sparse_random(
+        (n_samples, n_features), density=density, format="csr", random_state=0
     )
     X.data = np.random.RandomState(0).randn(X.getnnz())
     X = X.astype(dtype, copy=False)
-    coefs = sp.random(m=n_features, n=1, density=0.5, random_state=0)
+    coefs = _sparse_random((n_features, 1), density=0.5, random_state=0)
     coefs.data = np.random.RandomState(0).randn(coefs.getnnz())
     y = X.dot(coefs.toarray()).reshape(-1)
     y += 0.2 * y.std() * np.random.randn(n_samples)
@@ -155,9 +155,8 @@ def _random_dataset(
         X = np.random.RandomState(0).random_sample((n_samples, n_features))
         X = X.astype(dtype, copy=False)
     else:
-        X = sp.random(
-            n_samples,
-            n_features,
+        X = _sparse_random(
+            (n_samples, n_features),
             density=0.05,
             format="csr",
             dtype=dtype,
 
@@ -2,9 +2,9 @@
 
 import matplotlib.pyplot as plt
 import numpy as np
-import scipy.sparse as sparse
 
 from sklearn.preprocessing import PolynomialFeatures
+from sklearn.utils._sparse import _sparse_random
 
 degree = 2
 trials = 3
@@ -21,7 +21,7 @@
     for density in densities:
         for dim_index, dim in enumerate(dimensionalities):
             print(trial, density, dim)
-            X_csr = sparse.random(num_rows, dim, density).tocsr()
+            X_csr = _sparse_random((num_rows, dim), density=density, format="csr")
             X_dense = X_csr.toarray()
             # CSR
             t0 = time()
 
@@ -188,7 +188,7 @@ def get_data(dataset_name):
         data = np.repeat(data, 10)
         row = np.random.uniform(0, small_size, sparsity)
         col = np.random.uniform(0, small_size, sparsity)
-        X = sp.sparse.csr_matrix((data, (row, col)), shape=(size, small_size))
+        X = sp.sparse.csr_array((data, (row, col)), shape=(size, small_size))
         del data
         del row
         del col
 
@@ -70,7 +70,7 @@ def bench_scikit_transformer(X, transformer):
 # Gaussian distributed values
 def make_sparse_random_data(n_samples, n_features, n_nonzeros, random_state=None):
     rng = np.random.RandomState(random_state)
-    data_coo = sp.coo_matrix(
+    data_coo = sp.coo_array(
         (
             rng.randn(n_nonzeros),
             (
 
@@ -56,11 +56,11 @@ that contain the missing values::
 The :class:`SimpleImputer` class also supports sparse matrices::
 
     >>> import scipy.sparse as sp
-    >>> X = sp.csc_matrix([[1, 2], [0, -1], [8, 4]])
+    >>> X = sp.csc_array([[1, 2], [0, -1], [8, 4]])
     >>> imp = SimpleImputer(missing_values=-1, strategy='mean')
     >>> imp.fit(X)
     SimpleImputer(missing_values=-1)
-    >>> X_test = sp.csc_matrix([[-1, 2], [6, -1], [7, 6]])
+    >>> X_test = sp.csc_array([[-1, 2], [6, -1], [7, 6]])
     >>> print(imp.transform(X_test).toarray())
     [[3. 2.]
      [6. 3.]
 
@@ -170,9 +170,9 @@ Valid :term:`multiclass` representations for
      [1 0 0]
      [0 1 0]]
     >>> from scipy import sparse
-    >>> y_sparse = sparse.csr_matrix(y_dense)
+    >>> y_sparse = sparse.csr_array(y_dense)
     >>> print(y_sparse)
-    <Compressed Sparse Row sparse matrix of dtype 'int64'
+    <Compressed Sparse Row sparse array of dtype 'int64'
       with 4 stored elements and shape (4, 3)>
       Coords Values
       (0, 0) 1
@@ -380,9 +380,9 @@ refer to :ref:`preprocessing_targets`.
 
 An example of the same ``y`` in sparse matrix form:
 
-  >>> y_sparse = sparse.csr_matrix(y)
+  >>> y_sparse = sparse.csr_array(y)
   >>> print(y_sparse)
-  <Compressed Sparse Row sparse matrix of dtype 'int64'
+  <Compressed Sparse Row sparse array of dtype 'int64'
     with 4 stored elements and shape (3, 4)>
     Coords Values
     (0, 0) 1
 
@@ -89,7 +89,9 @@ def build_projection_operator(l_x, n_dir):
         weights += list(w[mask])
         camera_inds += list(inds[mask] + i * l_x)
         data_inds += list(data_unravel_indices[mask])
-    proj_operator = sparse.coo_matrix((weights, (camera_inds, data_inds)))
+    camera_inds = np.array(camera_inds, dtype=np.int32)  # lasso needs int32 inds
+    data_inds = np.array(data_inds, dtype=np.int32)
+    proj_operator = sparse.coo_array((weights, (camera_inds, data_inds)))
     return proj_operator
 
 
 
@@ -146,7 +146,7 @@ def get_adjacency_matrix(redirects_filename, page_links_filename, limit=None):
             break
 
     print("Computing the adjacency matrix")
-    X = sparse.lil_matrix((len(index_map), len(index_map)), dtype=np.float32)
+    X = sparse.lil_array((len(index_map), len(index_map)), dtype=np.float32)
     for i, j in links:
         X[i, j] = 1.0
     del links
 
@@ -32,7 +32,7 @@
 
 X, y = make_regression(n_samples=200, n_features=5000, random_state=0)
 # create a copy of X in sparse format
-X_sp = sparse.coo_matrix(X)
+X_sp = sparse.coo_array(X)
 
 alpha = 1
 sparse_lasso = Lasso(alpha=alpha, fit_intercept=False, max_iter=1000)
@@ -64,7 +64,7 @@
 # make Xs sparse by replacing the values lower than 2.5 with 0s
 Xs[Xs < 2.5] = 0.0
 # create a copy of Xs in sparse format
-Xs_sp = sparse.coo_matrix(Xs)
+Xs_sp = sparse.coo_array(Xs)
 Xs_sp = Xs_sp.tocsc()
 
 # compute the proportion of non-zero coefficient in the data matrix
 
@@ -39,7 +39,7 @@
 # `nmslib`, as well as a loading function.
 import joblib
 import numpy as np
-from scipy.sparse import csr_matrix
+from scipy.sparse import csr_array
 
 from sklearn.base import BaseEstimator, TransformerMixin
 from sklearn.datasets import fetch_openml
@@ -93,7 +93,7 @@ def transform(self, X):
         indices, distances = np.vstack(indices), np.vstack(distances)
 
         indptr = np.arange(0, n_samples_transform * n_neighbors + 1, n_neighbors)
-        kneighbors_graph = csr_matrix(
+        kneighbors_graph = csr_array(
             (distances.ravel(), indices.ravel(), indptr),
             shape=(n_samples_transform, self.n_samples_fit_),
         )
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -70,7 +70,7 @@ def bench_scikit_transformer(X, transformer):` |
| 70 | 70 | `# Gaussian distributed values` |
| 71 | 71 | `def make_sparse_random_data(n_samples, n_features, n_nonzeros, random_state=None):` |
| 72 | 72 | `    rng = np.random.RandomState(random_state)` |
| 73 |  | `-    data_coo = sp.coo_matrix(` |
|  | 73 | `+    data_coo = sp.coo_array(` |
| 74 | 74 | `        (` |
| 75 | 75 | `            rng.randn(n_nonzeros),` |
| 76 | 76 | `            (` |