From 6a2745c7cc86826390e12c1bd6319f38109b601c Mon Sep 17 00:00:00 2001
From: x99b <Bartek.Betkowski@freenet.ag>
Date: Thu, 12 Jun 2025 12:23:44 +0000
Subject: [PATCH 1/5] Add `TargetEncoder` for scikit-learn

---
 stubs/sklearn/preprocessing/__init__.pyi  |  3 ++-
 stubs/sklearn/preprocessing/_encoders.pyi | 28 ++++++++++++++++++++++-
 2 files changed, 29 insertions(+), 2 deletions(-)

diff --git a/stubs/sklearn/preprocessing/__init__.pyi b/stubs/sklearn/preprocessing/__init__.pyi
index ea623258..e360a6c1 100644
--- a/stubs/sklearn/preprocessing/__init__.pyi
+++ b/stubs/sklearn/preprocessing/__init__.pyi
@@ -19,7 +19,7 @@ from ._data import (
     scale as scale,
 )
 from ._discretization import KBinsDiscretizer as KBinsDiscretizer
-from ._encoders import OneHotEncoder as OneHotEncoder, OrdinalEncoder as OrdinalEncoder
+from ._encoders import OneHotEncoder as OneHotEncoder, OrdinalEncoder as OrdinalEncoder, TargetEncoder as TargetEncoder
 from ._function_transformer import FunctionTransformer as FunctionTransformer
 from ._label import (
     LabelBinarizer as LabelBinarizer,
@@ -47,6 +47,7 @@ __all__ = [
     "RobustScaler",
     "SplineTransformer",
     "StandardScaler",
+    "TargetEncoder",
     "add_dummy_feature",
     "PolynomialFeatures",
     "binarize",
diff --git a/stubs/sklearn/preprocessing/_encoders.pyi b/stubs/sklearn/preprocessing/_encoders.pyi
index 15fb4bcb..f2676543 100644
--- a/stubs/sklearn/preprocessing/_encoders.pyi
+++ b/stubs/sklearn/preprocessing/_encoders.pyi
@@ -13,7 +13,7 @@ from ..base import BaseEstimator, OneToOneFeatureMixin, TransformerMixin
 #          Joris Van den Bossche <jorisvandenbossche@gmail.com>
 # License: BSD 3 clause
 
-__all__ = ["OneHotEncoder", "OrdinalEncoder"]
+__all__ = ["OneHotEncoder", "OrdinalEncoder", "TargetEncoder"]
 
 class _BaseEncoder(TransformerMixin, BaseEstimator): ...
 
@@ -67,3 +67,29 @@ class OrdinalEncoder(OneToOneFeatureMixin, _BaseEncoder):
     def fit(self, X: MatrixLike, y: Series | None = None) -> Self: ...
     def transform(self, X: MatrixLike) -> ndarray: ...
     def inverse_transform(self, X: MatrixLike) -> ndarray: ...
+
+class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
+    feature_names_in_: ndarray = ...
+    n_features_in_: int = ...
+    categories_: list[ndarray] = ...
+    encodings_: list[ndarray] = ...
+    target_type_: str = ...
+    target_mean_: float = ...
+    classes_: ndarray | None = ...
+
+    _parameter_constraints: ClassVar[dict] = ...
+
+    def __init__(
+        self,
+        *,
+        categories: Sequence[ArrayLike] | Literal["auto"] = "auto",
+        target_type: Literal["auto", "continuous", "binary", "multiclass"] = "auto",
+        smooth: Literal["auto"] | float = "auto",
+        cv: int = 5,
+        shuffle: bool = True,
+        random_state: Int | None = None,
+    ) -> None: ...
+    def fit(self, X: MatrixLike, y: ArrayLike) -> Self: ...
+    def transform(self, X: MatrixLike) -> ndarray: ...
+    def fit_transform(self, X: MatrixLike, y: ArrayLike) -> ndarray: ...
+    def get_feature_names_out(self, input_features: None | ArrayLike = None) -> ndarray: ...

From 65063a3432e3963edd1e20d6409c41b6347c0416 Mon Sep 17 00:00:00 2001
From: x99b <Bartek.Betkowski@freenet.ag>
Date: Fri, 13 Jun 2025 04:33:11 +0000
Subject: [PATCH 2/5] Update `TargetEncoder` to change `target_mean_` type to
 `ndarray` and add `infrequent_categories_` property

---
 stubs/sklearn/preprocessing/_encoders.pyi | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/stubs/sklearn/preprocessing/_encoders.pyi b/stubs/sklearn/preprocessing/_encoders.pyi
index f2676543..a83e3529 100644
--- a/stubs/sklearn/preprocessing/_encoders.pyi
+++ b/stubs/sklearn/preprocessing/_encoders.pyi
@@ -74,9 +74,12 @@ class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
     categories_: list[ndarray] = ...
     encodings_: list[ndarray] = ...
     target_type_: str = ...
-    target_mean_: float = ...
+    target_mean_: ndarray = ...
     classes_: ndarray | None = ...
 
+    @property
+    def infrequent_categories_(self) -> list[ndarray]: ...
+
     _parameter_constraints: ClassVar[dict] = ...
 
     def __init__(

From 2ce83943f079316802b8b818efaf7184fd3dc500 Mon Sep 17 00:00:00 2001
From: x99b <Bartek.Betkowski@freenet.ag>
Date: Fri, 13 Jun 2025 05:32:14 +0000
Subject: [PATCH 3/5] Make TargetEncoder from sklearn.preprocessing match with
 actual sourcecode

---
 stubs/sklearn/preprocessing/__init__.pyi      |  21 +-
 stubs/sklearn/preprocessing/_encoders.pyi     |  31 +--
 .../sklearn/preprocessing/_target_encoder.pyi | 201 ++++++++++++++++++
 3 files changed, 213 insertions(+), 40 deletions(-)
 create mode 100644 stubs/sklearn/preprocessing/_target_encoder.pyi

diff --git a/stubs/sklearn/preprocessing/__init__.pyi b/stubs/sklearn/preprocessing/__init__.pyi
index e360a6c1..7c548a89 100644
--- a/stubs/sklearn/preprocessing/__init__.pyi
+++ b/stubs/sklearn/preprocessing/__init__.pyi
@@ -19,7 +19,7 @@ from ._data import (
     scale as scale,
 )
 from ._discretization import KBinsDiscretizer as KBinsDiscretizer
-from ._encoders import OneHotEncoder as OneHotEncoder, OrdinalEncoder as OrdinalEncoder, TargetEncoder as TargetEncoder
+from ._encoders import OneHotEncoder as OneHotEncoder, OrdinalEncoder as OrdinalEncoder
 from ._function_transformer import FunctionTransformer as FunctionTransformer
 from ._label import (
     LabelBinarizer as LabelBinarizer,
@@ -28,6 +28,7 @@ from ._label import (
     label_binarize as label_binarize,
 )
 from ._polynomial import PolynomialFeatures as PolynomialFeatures, SplineTransformer as SplineTransformer
+from ._target_encoder import TargetEncoder as TargetEncoder
 
 __all__ = [
     "Binarizer",
@@ -36,27 +37,27 @@ __all__ = [
     "KernelCenterer",
     "LabelBinarizer",
     "LabelEncoder",
-    "MultiLabelBinarizer",
-    "MinMaxScaler",
     "MaxAbsScaler",
-    "QuantileTransformer",
+    "MinMaxScaler",
+    "MultiLabelBinarizer",
     "Normalizer",
     "OneHotEncoder",
     "OrdinalEncoder",
+    "PolynomialFeatures",
     "PowerTransformer",
+    "QuantileTransformer",
     "RobustScaler",
     "SplineTransformer",
     "StandardScaler",
     "TargetEncoder",
     "add_dummy_feature",
-    "PolynomialFeatures",
     "binarize",
-    "normalize",
-    "scale",
-    "robust_scale",
+    "label_binarize",
     "maxabs_scale",
     "minmax_scale",
-    "label_binarize",
-    "quantile_transform",
+    "normalize",
     "power_transform",
+    "quantile_transform",
+    "robust_scale",
+    "scale",
 ]
diff --git a/stubs/sklearn/preprocessing/_encoders.pyi b/stubs/sklearn/preprocessing/_encoders.pyi
index a83e3529..15fb4bcb 100644
--- a/stubs/sklearn/preprocessing/_encoders.pyi
+++ b/stubs/sklearn/preprocessing/_encoders.pyi
@@ -13,7 +13,7 @@ from ..base import BaseEstimator, OneToOneFeatureMixin, TransformerMixin
 #          Joris Van den Bossche <jorisvandenbossche@gmail.com>
 # License: BSD 3 clause
 
-__all__ = ["OneHotEncoder", "OrdinalEncoder", "TargetEncoder"]
+__all__ = ["OneHotEncoder", "OrdinalEncoder"]
 
 class _BaseEncoder(TransformerMixin, BaseEstimator): ...
 
@@ -67,32 +67,3 @@ class OrdinalEncoder(OneToOneFeatureMixin, _BaseEncoder):
     def fit(self, X: MatrixLike, y: Series | None = None) -> Self: ...
     def transform(self, X: MatrixLike) -> ndarray: ...
     def inverse_transform(self, X: MatrixLike) -> ndarray: ...
-
-class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
-    feature_names_in_: ndarray = ...
-    n_features_in_: int = ...
-    categories_: list[ndarray] = ...
-    encodings_: list[ndarray] = ...
-    target_type_: str = ...
-    target_mean_: ndarray = ...
-    classes_: ndarray | None = ...
-
-    @property
-    def infrequent_categories_(self) -> list[ndarray]: ...
-
-    _parameter_constraints: ClassVar[dict] = ...
-
-    def __init__(
-        self,
-        *,
-        categories: Sequence[ArrayLike] | Literal["auto"] = "auto",
-        target_type: Literal["auto", "continuous", "binary", "multiclass"] = "auto",
-        smooth: Literal["auto"] | float = "auto",
-        cv: int = 5,
-        shuffle: bool = True,
-        random_state: Int | None = None,
-    ) -> None: ...
-    def fit(self, X: MatrixLike, y: ArrayLike) -> Self: ...
-    def transform(self, X: MatrixLike) -> ndarray: ...
-    def fit_transform(self, X: MatrixLike, y: ArrayLike) -> ndarray: ...
-    def get_feature_names_out(self, input_features: None | ArrayLike = None) -> ndarray: ...
diff --git a/stubs/sklearn/preprocessing/_target_encoder.pyi b/stubs/sklearn/preprocessing/_target_encoder.pyi
new file mode 100644
index 00000000..c97f15f8
--- /dev/null
+++ b/stubs/sklearn/preprocessing/_target_encoder.pyi
@@ -0,0 +1,201 @@
+from typing import ClassVar, Literal
+from typing_extensions import Self
+
+from numpy import ndarray
+
+from .._typing import ArrayLike, Int, MatrixLike
+from ..base import OneToOneFeatureMixin
+from ._encoders import _BaseEncoder
+
+class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
+    """Target Encoder for regression and classification targets.
+
+    Each category is encoded based on a shrunk estimate of the average target
+    values for observations belonging to the category. The encoding scheme mixes
+    the global target mean with the target mean conditioned on the value of the
+    category (see [MIC]_).
+
+    When the target type is "multiclass", encodings are based
+    on the conditional probability estimate for each class. The target is first
+    binarized using the "one-vs-all" scheme via
+    :class:`~sklearn.preprocessing.LabelBinarizer`, then the average target
+    value for each class and each category is used for encoding, resulting in
+    `n_features` * `n_classes` encoded output features.
+
+    :class:`TargetEncoder` considers missing values, such as `np.nan` or `None`,
+    as another category and encodes them like any other category. Categories
+    that are not seen during :meth:`fit` are encoded with the target mean, i.e.
+    `target_mean_`.
+
+    For a demo on the importance of the `TargetEncoder` internal cross-fitting,
+    see
+    :ref:`sphx_glr_auto_examples_preprocessing_plot_target_encoder_cross_val.py`.
+    For a comparison of different encoders, refer to
+    :ref:`sphx_glr_auto_examples_preprocessing_plot_target_encoder.py`. Read
+    more in the :ref:`User Guide <target_encoder>`.
+
+    .. note::
+        `fit(X, y).transform(X)` does not equal `fit_transform(X, y)` because a
+        :term:`cross fitting` scheme is used in `fit_transform` for encoding.
+        See the :ref:`User Guide <target_encoder>` for details.
+
+    .. versionadded:: 1.3
+
+    Parameters
+    ----------
+    categories : "auto" or list of shape (n_features,) of array-like, default="auto"
+        Categories (unique values) per feature:
+
+        - `"auto"` : Determine categories automatically from the training data.
+        - list : `categories[i]` holds the categories expected in the i-th column. The
+          passed categories should not mix strings and numeric values within a single
+          feature, and should be sorted in case of numeric values.
+
+        The used categories are stored in the `categories_` fitted attribute.
+
+    target_type : {"auto", "continuous", "binary", "multiclass"}, default="auto"
+        Type of target.
+
+        - `"auto"` : Type of target is inferred with
+          :func:`~sklearn.utils.multiclass.type_of_target`.
+        - `"continuous"` : Continuous target
+        - `"binary"` : Binary target
+        - `"multiclass"` : Multiclass target
+
+        .. note::
+            The type of target inferred with `"auto"` may not be the desired target
+            type used for modeling. For example, if the target consisted of integers
+            between 0 and 100, then :func:`~sklearn.utils.multiclass.type_of_target`
+            will infer the target as `"multiclass"`. In this case, setting
+            `target_type="continuous"` will specify the target as a regression
+            problem. The `target_type_` attribute gives the target type used by the
+            encoder.
+
+        .. versionchanged:: 1.4
+           Added the option 'multiclass'.
+
+    smooth : "auto" or float, default="auto"
+        The amount of mixing of the target mean conditioned on the value of the
+        category with the global target mean. A larger `smooth` value will put
+        more weight on the global target mean.
+        If `"auto"`, then `smooth` is set to an empirical Bayes estimate.
+
+    cv : int, default=5
+        Determines the number of folds in the :term:`cross fitting` strategy used in
+        :meth:`fit_transform`. For classification targets, `StratifiedKFold` is used
+        and for continuous targets, `KFold` is used.
+
+    shuffle : bool, default=True
+        Whether to shuffle the data in :meth:`fit_transform` before splitting into
+        folds. Note that the samples within each split will not be shuffled.
+
+    random_state : int, RandomState instance or None, default=None
+        When `shuffle` is True, `random_state` affects the ordering of the
+        indices, which controls the randomness of each fold. Otherwise, this
+        parameter has no effect.
+        Pass an int for reproducible output across multiple function calls.
+        See :term:`Glossary <random_state>`.
+
+    Attributes
+    ----------
+    encodings_ : list of shape (n_features,) or (n_features * n_classes) of \
+                    ndarray
+        Encodings learnt on all of `X`.
+        For feature `i`, `encodings_[i]` are the encodings matching the
+        categories listed in `categories_[i]`. When `target_type_` is
+        "multiclass", the encoding for feature `i` and class `j` is stored in
+        `encodings_[j + (i * len(classes_))]`. E.g., for 2 features (f) and
+        3 classes (c), encodings are ordered:
+        f0_c0, f0_c1, f0_c2, f1_c0, f1_c1, f1_c2,
+
+    categories_ : list of shape (n_features,) of ndarray
+        The categories of each input feature determined during fitting or
+        specified in `categories`
+        (in order of the features in `X` and corresponding with the output
+        of :meth:`transform`).
+
+    target_type_ : str
+        Type of target.
+
+    target_mean_ : float
+        The overall mean of the target. This value is only used in :meth:`transform`
+        to encode categories.
+
+    n_features_in_ : int
+        Number of features seen during :term:`fit`.
+
+    feature_names_in_ : ndarray of shape (`n_features_in_`,)
+        Names of features seen during :term:`fit`. Defined only when `X`
+        has feature names that are all strings.
+
+    classes_ : ndarray or None
+        If `target_type_` is 'binary' or 'multiclass', holds the label for each class,
+        otherwise `None`.
+
+    See Also
+    --------
+    OrdinalEncoder : Performs an ordinal (integer) encoding of the categorical features.
+        Contrary to TargetEncoder, this encoding is not supervised. Treating the
+        resulting encoding as a numerical features therefore lead arbitrarily
+        ordered values and therefore typically lead to lower predictive performance
+        when used as preprocessing for a classifier or regressor.
+    OneHotEncoder : Performs a one-hot encoding of categorical features. This
+        unsupervised encoding is better suited for low cardinality categorical
+        variables as it generate one new feature per unique category.
+
+    References
+    ----------
+    .. [MIC] :doi:`Micci-Barreca, Daniele. "A preprocessing scheme for high-cardinality
+       categorical attributes in classification and prediction problems"
+       SIGKDD Explor. Newsl. 3, 1 (July 2001), 27–32. <10.1145/507533.507538>`
+
+    Examples
+    --------
+    With `smooth="auto"`, the smoothing parameter is set to an empirical Bayes estimate:
+
+    >>> import numpy as np
+    >>> from sklearn.preprocessing import TargetEncoder
+    >>> X = np.array([["dog"] * 20 + ["cat"] * 30 + ["snake"] * 38], dtype=object).T
+    >>> y = [90.3] * 5 + [80.1] * 15 + [20.4] * 5 + [20.1] * 25 + [21.2] * 8 + [49] * 30
+    >>> enc_auto = TargetEncoder(smooth="auto")
+    >>> X_trans = enc_auto.fit_transform(X, y)
+
+    >>> # A high `smooth` parameter puts more weight on global mean on the categorical
+    >>> # encodings:
+    >>> enc_high_smooth = TargetEncoder(smooth=5000.0).fit(X, y)
+    >>> enc_high_smooth.target_mean_
+    np.float64(44.3)
+    >>> enc_high_smooth.encodings_
+    [array([44.1, 44.4, 44.3])]
+
+    >>> # On the other hand, a low `smooth` parameter puts more weight on target
+    >>> # conditioned on the value of the categorical:
+    >>> enc_low_smooth = TargetEncoder(smooth=1.0).fit(X, y)
+    >>> enc_low_smooth.encodings_
+    [array([21, 80.8, 43.2])]
+    """
+
+    encodings_: list[ndarray]
+    categories_: list[ndarray]
+    target_type_: str
+    target_mean_: float
+    n_features_in_: int
+    feature_names_in_: ndarray
+    classes_: ndarray | None
+
+    _parameter_constraints: ClassVar[dict] = ...
+
+    def __init__(
+        self,
+        categories: list[ArrayLike] | Literal["auto"] = "auto",
+        target_type: Literal["auto", "continuous", "binary", "multiclass"] = "auto",
+        smooth: Literal["auto"] | float = "auto",
+        cv: int = 5,
+        shuffle: bool = True,
+        random_state: Int | None = None,
+    ) -> None: ...
+    def fit(self, X: MatrixLike, y: ArrayLike) -> Self: ...
+    def fit_transform(self, X: MatrixLike, y: ArrayLike) -> ndarray: ...
+    def transform(self, X: MatrixLike) -> ndarray: ...
+    def get_feature_names_out(self, input_features: ArrayLike | None = None) -> ndarray: ...
+    def __sklearn_tags__(self) -> dict: ...

From 42c218416d4a1ea31136cbfd3e31ad0bd9b2f9c9 Mon Sep 17 00:00:00 2001
From: x99b <Bartek.Betkowski@freenet.ag>
Date: Fri, 13 Jun 2025 05:37:04 +0000
Subject: [PATCH 4/5] Fix formatting of citation in TargetEncoder docstring

---
 stubs/sklearn/preprocessing/_target_encoder.pyi | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/stubs/sklearn/preprocessing/_target_encoder.pyi b/stubs/sklearn/preprocessing/_target_encoder.pyi
index c97f15f8..93a6517f 100644
--- a/stubs/sklearn/preprocessing/_target_encoder.pyi
+++ b/stubs/sklearn/preprocessing/_target_encoder.pyi
@@ -147,7 +147,7 @@ class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
     ----------
     .. [MIC] :doi:`Micci-Barreca, Daniele. "A preprocessing scheme for high-cardinality
        categorical attributes in classification and prediction problems"
-       SIGKDD Explor. Newsl. 3, 1 (July 2001), 27–32. <10.1145/507533.507538>`
+       SIGKDD Explor. Newsl. 3, 1 (July 2001), 27-32. <10.1145/507533.507538>`
 
     Examples
     --------

From b3389c1329433ef7afc299e5e662d82108cab09d Mon Sep 17 00:00:00 2001
From: x99b <Bartek.Betkowski@freenet.ag>
Date: Fri, 13 Jun 2025 05:38:33 +0000
Subject: [PATCH 5/5] Remove extensive docstring from TargetEncoder class

---
 .../sklearn/preprocessing/_target_encoder.pyi | 167 ------------------
 1 file changed, 167 deletions(-)

diff --git a/stubs/sklearn/preprocessing/_target_encoder.pyi b/stubs/sklearn/preprocessing/_target_encoder.pyi
index 93a6517f..31a178d9 100644
--- a/stubs/sklearn/preprocessing/_target_encoder.pyi
+++ b/stubs/sklearn/preprocessing/_target_encoder.pyi
@@ -8,173 +8,6 @@ from ..base import OneToOneFeatureMixin
 from ._encoders import _BaseEncoder
 
 class TargetEncoder(OneToOneFeatureMixin, _BaseEncoder):
-    """Target Encoder for regression and classification targets.
-
-    Each category is encoded based on a shrunk estimate of the average target
-    values for observations belonging to the category. The encoding scheme mixes
-    the global target mean with the target mean conditioned on the value of the
-    category (see [MIC]_).
-
-    When the target type is "multiclass", encodings are based
-    on the conditional probability estimate for each class. The target is first
-    binarized using the "one-vs-all" scheme via
-    :class:`~sklearn.preprocessing.LabelBinarizer`, then the average target
-    value for each class and each category is used for encoding, resulting in
-    `n_features` * `n_classes` encoded output features.
-
-    :class:`TargetEncoder` considers missing values, such as `np.nan` or `None`,
-    as another category and encodes them like any other category. Categories
-    that are not seen during :meth:`fit` are encoded with the target mean, i.e.
-    `target_mean_`.
-
-    For a demo on the importance of the `TargetEncoder` internal cross-fitting,
-    see
-    :ref:`sphx_glr_auto_examples_preprocessing_plot_target_encoder_cross_val.py`.
-    For a comparison of different encoders, refer to
-    :ref:`sphx_glr_auto_examples_preprocessing_plot_target_encoder.py`. Read
-    more in the :ref:`User Guide <target_encoder>`.
-
-    .. note::
-        `fit(X, y).transform(X)` does not equal `fit_transform(X, y)` because a
-        :term:`cross fitting` scheme is used in `fit_transform` for encoding.
-        See the :ref:`User Guide <target_encoder>` for details.
-
-    .. versionadded:: 1.3
-
-    Parameters
-    ----------
-    categories : "auto" or list of shape (n_features,) of array-like, default="auto"
-        Categories (unique values) per feature:
-
-        - `"auto"` : Determine categories automatically from the training data.
-        - list : `categories[i]` holds the categories expected in the i-th column. The
-          passed categories should not mix strings and numeric values within a single
-          feature, and should be sorted in case of numeric values.
-
-        The used categories are stored in the `categories_` fitted attribute.
-
-    target_type : {"auto", "continuous", "binary", "multiclass"}, default="auto"
-        Type of target.
-
-        - `"auto"` : Type of target is inferred with
-          :func:`~sklearn.utils.multiclass.type_of_target`.
-        - `"continuous"` : Continuous target
-        - `"binary"` : Binary target
-        - `"multiclass"` : Multiclass target
-
-        .. note::
-            The type of target inferred with `"auto"` may not be the desired target
-            type used for modeling. For example, if the target consisted of integers
-            between 0 and 100, then :func:`~sklearn.utils.multiclass.type_of_target`
-            will infer the target as `"multiclass"`. In this case, setting
-            `target_type="continuous"` will specify the target as a regression
-            problem. The `target_type_` attribute gives the target type used by the
-            encoder.
-
-        .. versionchanged:: 1.4
-           Added the option 'multiclass'.
-
-    smooth : "auto" or float, default="auto"
-        The amount of mixing of the target mean conditioned on the value of the
-        category with the global target mean. A larger `smooth` value will put
-        more weight on the global target mean.
-        If `"auto"`, then `smooth` is set to an empirical Bayes estimate.
-
-    cv : int, default=5
-        Determines the number of folds in the :term:`cross fitting` strategy used in
-        :meth:`fit_transform`. For classification targets, `StratifiedKFold` is used
-        and for continuous targets, `KFold` is used.
-
-    shuffle : bool, default=True
-        Whether to shuffle the data in :meth:`fit_transform` before splitting into
-        folds. Note that the samples within each split will not be shuffled.
-
-    random_state : int, RandomState instance or None, default=None
-        When `shuffle` is True, `random_state` affects the ordering of the
-        indices, which controls the randomness of each fold. Otherwise, this
-        parameter has no effect.
-        Pass an int for reproducible output across multiple function calls.
-        See :term:`Glossary <random_state>`.
-
-    Attributes
-    ----------
-    encodings_ : list of shape (n_features,) or (n_features * n_classes) of \
-                    ndarray
-        Encodings learnt on all of `X`.
-        For feature `i`, `encodings_[i]` are the encodings matching the
-        categories listed in `categories_[i]`. When `target_type_` is
-        "multiclass", the encoding for feature `i` and class `j` is stored in
-        `encodings_[j + (i * len(classes_))]`. E.g., for 2 features (f) and
-        3 classes (c), encodings are ordered:
-        f0_c0, f0_c1, f0_c2, f1_c0, f1_c1, f1_c2,
-
-    categories_ : list of shape (n_features,) of ndarray
-        The categories of each input feature determined during fitting or
-        specified in `categories`
-        (in order of the features in `X` and corresponding with the output
-        of :meth:`transform`).
-
-    target_type_ : str
-        Type of target.
-
-    target_mean_ : float
-        The overall mean of the target. This value is only used in :meth:`transform`
-        to encode categories.
-
-    n_features_in_ : int
-        Number of features seen during :term:`fit`.
-
-    feature_names_in_ : ndarray of shape (`n_features_in_`,)
-        Names of features seen during :term:`fit`. Defined only when `X`
-        has feature names that are all strings.
-
-    classes_ : ndarray or None
-        If `target_type_` is 'binary' or 'multiclass', holds the label for each class,
-        otherwise `None`.
-
-    See Also
-    --------
-    OrdinalEncoder : Performs an ordinal (integer) encoding of the categorical features.
-        Contrary to TargetEncoder, this encoding is not supervised. Treating the
-        resulting encoding as a numerical features therefore lead arbitrarily
-        ordered values and therefore typically lead to lower predictive performance
-        when used as preprocessing for a classifier or regressor.
-    OneHotEncoder : Performs a one-hot encoding of categorical features. This
-        unsupervised encoding is better suited for low cardinality categorical
-        variables as it generate one new feature per unique category.
-
-    References
-    ----------
-    .. [MIC] :doi:`Micci-Barreca, Daniele. "A preprocessing scheme for high-cardinality
-       categorical attributes in classification and prediction problems"
-       SIGKDD Explor. Newsl. 3, 1 (July 2001), 27-32. <10.1145/507533.507538>`
-
-    Examples
-    --------
-    With `smooth="auto"`, the smoothing parameter is set to an empirical Bayes estimate:
-
-    >>> import numpy as np
-    >>> from sklearn.preprocessing import TargetEncoder
-    >>> X = np.array([["dog"] * 20 + ["cat"] * 30 + ["snake"] * 38], dtype=object).T
-    >>> y = [90.3] * 5 + [80.1] * 15 + [20.4] * 5 + [20.1] * 25 + [21.2] * 8 + [49] * 30
-    >>> enc_auto = TargetEncoder(smooth="auto")
-    >>> X_trans = enc_auto.fit_transform(X, y)
-
-    >>> # A high `smooth` parameter puts more weight on global mean on the categorical
-    >>> # encodings:
-    >>> enc_high_smooth = TargetEncoder(smooth=5000.0).fit(X, y)
-    >>> enc_high_smooth.target_mean_
-    np.float64(44.3)
-    >>> enc_high_smooth.encodings_
-    [array([44.1, 44.4, 44.3])]
-
-    >>> # On the other hand, a low `smooth` parameter puts more weight on target
-    >>> # conditioned on the value of the categorical:
-    >>> enc_low_smooth = TargetEncoder(smooth=1.0).fit(X, y)
-    >>> enc_low_smooth.encodings_
-    [array([21, 80.8, 43.2])]
-    """
-
     encodings_: list[ndarray]
     categories_: list[ndarray]
     target_type_: str