diff --git a/scikits/learn/feature_extraction/text/dense.py b/scikits/learn/feature_extraction/text/dense.py index 379f1c92c75bbc81e84f86d0f73f3a41a50ef6d3..181627efc44ff551bab46ef47773d7faaea8418d 100644 --- a/scikits/learn/feature_extraction/text/dense.py +++ b/scikits/learn/feature_extraction/text/dense.py @@ -228,7 +228,7 @@ class BaseCountVectorizer(BaseEstimator): Type of the matrix returned by fit_transform() or transform(). """ - def __init__(self, analyzer=DEFAULT_ANALYZER, vocabulary={}, max_df=0.5, + def __init__(self, analyzer=DEFAULT_ANALYZER, vocabulary={}, max_df=1.0, max_features=None, dtype=long): self.analyzer = analyzer self.vocabulary = vocabulary