siyacoderza
diff --git a/‎doc/developers/develop.rst
Lines changed: 18 additions & 9 deletions b/‎doc/developers/develop.rst
Lines changed: 18 additions & 9 deletions
diff --git a/‎sklearn/base.py
Lines changed: 5 additions & 26 deletions b/‎sklearn/base.py
Lines changed: 5 additions & 26 deletions
diff --git a/‎sklearn/feature_selection/_base.py
Lines changed: 14 additions & 6 deletions b/‎sklearn/feature_selection/_base.py
Lines changed: 14 additions & 6 deletions
diff --git a/‎sklearn/feature_selection/_from_model.py
Lines changed: 4 additions & 2 deletions b/‎sklearn/feature_selection/_from_model.py
Lines changed: 4 additions & 2 deletions
diff --git a/‎sklearn/feature_selection/_rfe.py
Lines changed: 8 additions & 6 deletions b/‎sklearn/feature_selection/_rfe.py
Lines changed: 8 additions & 6 deletions
diff --git a/‎sklearn/feature_selection/_sequential.py
Lines changed: 3 additions & 4 deletions b/‎sklearn/feature_selection/_sequential.py
Lines changed: 3 additions & 4 deletions
diff --git a/‎sklearn/feature_selection/tests/test_rfe.py
Lines changed: 3 additions & 6 deletions b/‎sklearn/feature_selection/tests/test_rfe.py
Lines changed: 3 additions & 6 deletions
diff --git a/‎sklearn/linear_model/_glm/tests/test_glm.py
Lines changed: 7 additions & 7 deletions b/‎sklearn/linear_model/_glm/tests/test_glm.py
Lines changed: 7 additions & 7 deletions
diff --git a/‎sklearn/linear_model/tests/test_coordinate_descent.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/linear_model/tests/test_coordinate_descent.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎sklearn/model_selection/_search.py
Lines changed: 2 additions & 2 deletions b/‎sklearn/model_selection/_search.py
Lines changed: 2 additions & 2 deletions
@@ -511,12 +511,12 @@ Scikit-learn introduced estimator tags in version 0.21. These are annotations
 of estimators that allow programmatic inspection of their capabilities, such as
 sparse matrix support, supported output types and supported methods. The
 estimator tags are a dictionary returned by the method ``_get_tags()``. These
-tags are used by the common tests and the
-:func:`sklearn.utils.estimator_checks.check_estimator` function to decide what
-tests to run and what input data is appropriate. Tags can depend on estimator
-parameters or even system architecture and can in general only be determined at
-runtime. The default values for the estimator tags are defined in the
-``BaseEstimator`` class.
+tags are used in the common checks run by the
+:func:`~sklearn.utils.estimator_checks.check_estimator` function and the
+:func:`~sklearn.utils.estimator_checks.parametrize_with_checks` decorator.
+Tags determine which checks to run and what input data is appropriate. Tags
+can depend on estimator parameters or even system architecture and can in
+general only be determined at runtime.
 
 The current set of estimator tags are:
 
@@ -618,16 +618,25 @@ X_types (default=['2darray'])
     ``'categorical'`` data. For now, the test for sparse data do not make use
     of the ``'sparse'`` tag.
 
-
-To override the tags of a child class, one must define the `_more_tags()`
-method and return a dict with the desired tags, e.g::
+It is unlikely that the default values for each tag will suit the needs of your
+specific estimator. Additional tags can be created or default tags can be
+overridden by defining a `_more_tags()` method which returns a dict with the
+desired overridden tags or new tags. For example::
 
     class MyMultiOutputEstimator(BaseEstimator):
 
         def _more_tags(self):
             return {'multioutput_only': True,
                     'non_deterministic': True}
 
+Any tag that is not returned by `_more_tags()` will fall back to the default
+values documented above.
+
+Although it is not recommended, it is possible to override the method
+`_get_tags()`. Note, however, that **all tags must be present in the dict**.
+If any of the keys documented above is missing from the output of
+`_get_tags()`, an error will occur.
+
 In addition to the tags, estimators also need to declare any non-optional
 parameters to ``__init__`` in the ``_required_parameters`` class attribute,
 which is a list or tuple.  If ``_required_parameters`` is only
 
@@ -15,32 +15,15 @@
 from . import __version__
 from ._config import get_config
 from .utils import _IS_32BIT
+from .utils._tags import (
+    _DEFAULT_TAGS,
+    _safe_tags,
+)
 from .utils.validation import check_X_y
 from .utils.validation import check_array
 from .utils._estimator_html_repr import estimator_html_repr
 from .utils.validation import _deprecate_positional_args
 
-_DEFAULT_TAGS = {
-    'non_deterministic': False,
-    'requires_positive_X': False,
-    'requires_positive_y': False,
-    'X_types': ['2darray'],
-    'poor_score': False,
-    'no_validation': False,
-    'multioutput': False,
-    "allow_nan": False,
-    'stateless': False,
-    'multilabel': False,
-    '_skip_test': False,
-    '_xfail_checks': False,
-    'multioutput_only': False,
-    'binary_only': False,
-    'requires_fit': True,
-    'preserves_dtype': [np.float64],
-    'requires_y': False,
-    'pairwise': False,
-    }
-
 
 @_deprecate_positional_args
 def clone(estimator, *, safe=True):
@@ -858,11 +841,7 @@ def _is_pairwise(estimator):
         warnings.filterwarnings('ignore', category=FutureWarning)
         has_pairwise_attribute = hasattr(estimator, '_pairwise')
         pairwise_attribute = getattr(estimator, '_pairwise', False)
-
-    if hasattr(estimator, '_get_tags') and callable(estimator._get_tags):
-        pairwise_tag = estimator._get_tags().get('pairwise', False)
-    else:
-        pairwise_tag = False
+    pairwise_tag = _safe_tags(estimator, key="pairwise")
 
     if has_pairwise_attribute:
         if pairwise_attribute != pairwise_tag:
 
@@ -12,9 +12,12 @@
 from scipy.sparse import issparse, csc_matrix
 
 from ..base import TransformerMixin
-from ..utils import check_array
-from ..utils import safe_mask
-from ..utils import safe_sqr
+from ..utils import (
+    check_array,
+    safe_mask,
+    safe_sqr,
+)
+from ..utils._tags import _safe_tags
 
 
 class SelectorMixin(TransformerMixin, metaclass=ABCMeta):
@@ -74,9 +77,14 @@ def transform(self, X):
         X_r : array of shape [n_samples, n_selected_features]
             The input samples with only the selected features.
         """
-        tags = self._get_tags()
-        X = check_array(X, dtype=None, accept_sparse='csr',
-                        force_all_finite=not tags.get('allow_nan', True))
+        # note: we use _safe_tags instead of _get_tags because this is a
+        # public Mixin.
+        X = check_array(
+            X,
+            dtype=None,
+            accept_sparse="csr",
+            force_all_finite=not _safe_tags(self, key="allow_nan"),
+        )
         mask = self.get_support()
         if not mask.any():
             warn("No features were selected: either the data is"
 
@@ -7,6 +7,7 @@
 from ._base import SelectorMixin
 from ._base import _get_feature_importances
 from ..base import BaseEstimator, clone, MetaEstimatorMixin
+from ..utils._tags import _safe_tags
 from ..utils.validation import check_is_fitted
 
 from ..exceptions import NotFittedError
@@ -283,5 +284,6 @@ def n_features_in_(self):
         return self.estimator_.n_features_in_
 
     def _more_tags(self):
-        estimator_tags = self.estimator._get_tags()
-        return {'allow_nan': estimator_tags.get('allow_nan', True)}
+        return {
+            'allow_nan': _safe_tags(self.estimator, key="allow_nan")
+        }
@@ -10,8 +10,10 @@
 import numbers
 from joblib import Parallel, effective_n_jobs
 
+
 from ..utils.metaestimators import if_delegate_has_method
 from ..utils.metaestimators import _safe_split
+from ..utils._tags import _safe_tags
 from ..utils.validation import check_is_fitted
 from ..utils.validation import _deprecate_positional_args
 from ..utils.fixes import delayed
@@ -191,7 +193,7 @@ def _fit(self, X, y, step_score=None):
         X, y = self._validate_data(
             X, y, accept_sparse="csc",
             ensure_min_features=2,
-            force_all_finite=not tags.get('allow_nan', True),
+            force_all_finite=not tags.get("allow_nan", True),
             multi_output=True
         )
         error_msg = ("n_features_to_select must be either None, a "
@@ -371,11 +373,11 @@ def predict_log_proba(self, X):
         return self.estimator_.predict_log_proba(self.transform(X))
 
     def _more_tags(self):
-        estimator_tags = self.estimator._get_tags()
-        return {'poor_score': True,
-                'allow_nan': estimator_tags.get('allow_nan', True),
-                'requires_y': True,
-                }
+        return {
+            'poor_score': True,
+            'allow_nan': _safe_tags(self.estimator, key='allow_nan'),
+            'requires_y': True,
+        }
 
 
 class RFECV(RFE):
 
@@ -7,6 +7,7 @@
 
 from ._base import SelectorMixin
 from ..base import BaseEstimator, MetaEstimatorMixin, clone
+from ..utils._tags import _safe_tags
 from ..utils.validation import check_is_fitted
 from ..model_selection import cross_val_score
 
@@ -128,12 +129,11 @@ def fit(self, X, y):
         -------
         self : object
         """
-
         tags = self._get_tags()
         X, y = self._validate_data(
             X, y, accept_sparse="csc",
             ensure_min_features=2,
-            force_all_finite=not tags.get('allow_nan', True),
+            force_all_finite=not tags.get("allow_nan", True),
             multi_output=True
         )
         n_features = X.shape[1]
@@ -207,8 +207,7 @@ def _get_support_mask(self):
         return self.support_
 
     def _more_tags(self):
-        estimator_tags = self.estimator._get_tags()
         return {
-            'allow_nan': estimator_tags.get('allow_nan', True),
+            'allow_nan': _safe_tags(self.estimator, key="allow_nan"),
             'requires_y': True,
         }
@@ -56,8 +56,8 @@ def get_params(self, deep=True):
     def set_params(self, **params):
         return self
 
-    def _get_tags(self):
-        return {}
+    def _more_tags(self):
+        return {"allow_nan": True}
 
 
 def test_rfe_features_importance():
@@ -448,10 +448,7 @@ def test_rfe_importance_getter_validation(importance_getter, err_type,
         model.fit(X, y)
 
 
-@pytest.mark.parametrize("cv", [
-    None,
-    5
-])
+@pytest.mark.parametrize("cv", [None, 5])
 def test_rfe_allow_nan_inf_in_x(cv):
     iris = load_iris()
     X = iris.data
 
@@ -419,13 +419,13 @@ def test_tweedie_regression_family(regression_data):
 
 
 @pytest.mark.parametrize(
-        'estimator, value',
-        [
-            (PoissonRegressor(), True),
-            (GammaRegressor(), True),
-            (TweedieRegressor(power=1.5), True),
-            (TweedieRegressor(power=0), False)
-        ],
+    'estimator, value',
+    [
+        (PoissonRegressor(), True),
+        (GammaRegressor(), True),
+        (TweedieRegressor(power=1.5), True),
+        (TweedieRegressor(power=0), False),
+    ],
 )
 def test_tags(estimator, value):
     assert estimator._get_tags()['requires_positive_y'] is value
@@ -300,7 +300,7 @@ def test_lasso_cv_positive_constraint():
      (Lars, {}),
      (LinearRegression, {}),
      (LassoLarsIC, {})]
- )
+)
 def test_model_pipeline_same_as_normalize_true(LinearModel, params):
     # Test that linear models (LinearModel) set with normalize set to True are
     # doing the same as the same linear model preceeded by StandardScaler
@@ -315,7 +315,7 @@ def test_model_pipeline_same_as_normalize_true(LinearModel, params):
         LinearModel(normalize=False, fit_intercept=True, **params)
     )
 
-    is_multitask = model_normalize._get_tags().get("multioutput_only", False)
+    is_multitask = model_normalize._get_tags()["multioutput_only"]
 
     # prepare the data
     n_samples, n_features = 100, 2
 
@@ -35,6 +35,7 @@
 from joblib import Parallel
 from ..utils import check_random_state
 from ..utils.random import sample_without_replacement
+from ..utils._tags import _safe_tags
 from ..utils.validation import indexable, check_is_fitted, _check_fit_params
 from ..utils.validation import _deprecate_positional_args
 from ..utils.metaestimators import if_delegate_has_method
@@ -433,9 +434,8 @@ def _estimator_type(self):
 
     def _more_tags(self):
         # allows cross-validation to see 'precomputed' metrics
-        estimator_tags = self.estimator._get_tags()
         return {
-            'pairwise': estimator_tags.get('pairwise', False),
+            'pairwise': _safe_tags(self.estimator, "pairwise"),
             "_xfail_checks": {"check_supervised_y_2d":
                               "DataConversionWarning not caught"},
         }