@@ -633,7 +633,7 @@ class HashingVectorizer(
633
633
'ascii' is a fast method that only works on characters that have
634
634
a direct ASCII mapping.
635
635
'unicode' is a slightly slower method that works on any character.
636
- None (default) does nothing.
636
+ None (default) means no character normalization is performed.
637
637
638
638
Both 'ascii' and 'unicode' use NFKD normalization from
639
639
:func:`unicodedata.normalize`.
@@ -964,7 +964,7 @@ class CountVectorizer(_VectorizerMixin, BaseEstimator):
964
964
'ascii' is a fast method that only works on characters that have
965
965
a direct ASCII mapping.
966
966
'unicode' is a slightly slower method that works on any character.
967
- None (default) does nothing.
967
+ None (default) means no character normalization is performed.
968
968
969
969
Both 'ascii' and 'unicode' use NFKD normalization from
970
970
:func:`unicodedata.normalize`.
@@ -1786,7 +1786,7 @@ class TfidfVectorizer(CountVectorizer):
1786
1786
'ascii' is a fast method that only works on characters that have
1787
1787
a direct ASCII mapping.
1788
1788
'unicode' is a slightly slower method that works on any character.
1789
- None (default) does nothing.
1789
+ None (default) means no character normalization is performed.
1790
1790
1791
1791
Both 'ascii' and 'unicode' use NFKD normalization from
1792
1792
:func:`unicodedata.normalize`.
@@ -1881,7 +1881,8 @@ class TfidfVectorizer(CountVectorizer):
1881
1881
binary : bool, default=False
1882
1882
If True, all non-zero term counts are set to 1. This does not mean
1883
1883
outputs will have only 0/1 values, only that the tf term in tf-idf
1884
- is binary. (Set idf and normalization to False to get 0/1 outputs).
1884
+ is binary. (Set `binary` to True, `use_idf` to False and
1885
+ `norm` to None to get 0/1 outputs).
1885
1886
1886
1887
dtype : dtype, default=float64
1887
1888
Type of the matrix returned by fit_transform() or transform().
0 commit comments