DOC fix linear programming derivation comment in QuantileRegressor (scikit-learn#21952)

lorentzenchr · glemaitre · commit bde8b38b52f1 · 2021-12-25T12:26:49.000+01:00
diff --git a/doc/whats_new/v1.1.rst b/doc/whats_new/v1.1.rst
@@ -158,6 +158,11 @@ Changelog
   This is particularly relevant when `n_features > n_samples` and the
   estimator of the noise variance cannot be computed.
   :pr:`21481` by :user:`Guillaume Lemaitre <glemaitre>`
+  :pr:`21481` by :user:`Guillaume Lemaitre <glemaitre>`.
+
+- |Enhancement| :class:`linear_model.QuantileRegressor` supports sparse input
+  for the highs-based solvers.
+  :pr:`21086` by :user:`Venkatachalam Natchiappan <venkyyuvy>`.
 
 - |Fix| :class:`linear_model.LassoLarsIC` now correctly computes AIC
   and BIC. An error is now raised when `n_features > n_samples` and
diff --git a/sklearn/linear_model/_quantile.py b/sklearn/linear_model/_quantile.py
@@ -200,13 +200,15 @@ def fit(self, X, y, sample_weight=None):
         else:
             solver_options = self.solver_options
 
+        # After rescaling alpha, the minimization problem is
+        #     min sum(pinball loss) + alpha * L1
         # Use linear programming formulation of quantile regression
         #     min_x c x
         #           A_eq x = b_eq
         #                0 <= x
         # x = (s0, s, t0, t, u, v) = slack variables
-        # intercept = s0 + t0
-        # coef = s + t
+        # intercept = s0 - t0
+        # coef = s - t
         # c = (alpha * 1_p, alpha * 1_p, quantile * 1_n, (1-quantile) * 1_n)
         # residual = y - X@coef - intercept = u - v
         # A_eq = (1_n, X, -1_n, -X, diag(1_n), -diag(1_n))
@@ -216,7 +218,7 @@ def fit(self, X, y, sample_weight=None):
         # 1_n = vector of length n with entries equal one
         # see https://stats.stackexchange.com/questions/384909/
         #
-        # Filtering out zero samples weights from the beginning makes life
+        # Filtering out zero sample weights from the beginning makes life
         # easier for the linprog solver.
         mask = sample_weight != 0
         n_mask = int(np.sum(mask))  # use n_mask instead of n_samples