ADD test cases to fill out VectorizerMixin coverage · seckcoder/scikit-learn@789d1d3 · GitHub
[go: up one dir, main page]

Skip to content

Commit 789d1d3

Browse files
committed
ADD test cases to fill out VectorizerMixin coverage
1 parent 357db85 commit 789d1d3

File tree

1 file changed

+13
-0
lines changed

1 file changed

+13
-0
lines changed

sklearn/feature_extraction/tests/test_text.py

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@
88
from sklearn.feature_extraction.text import CountVectorizer
99
from sklearn.feature_extraction.text import TfidfTransformer
1010
from sklearn.feature_extraction.text import TfidfVectorizer
11+
from sklearn.feature_extraction.text import VectorizerMixin
1112

1213
from sklearn.feature_extraction.text import ENGLISH_STOP_WORDS
1314

@@ -427,6 +428,18 @@ def test_vectorizer():
427428
assert_raises(ValueError, v3.transform, train_data)
428429

429430

431+
def test_vectorizer_mixin():
432+
# test a few cases in VectorizerMixin
433+
vm = VectorizerMixin()
434+
vm.preprocessor = None
435+
vm.strip_accents = 'gabbldegook'
436+
assert_raises(ValueError, vm.build_preprocessor)
437+
438+
vm.lowercase = False
439+
vm.strip_accents = 'ascii'
440+
assert_equal(vm.build_preprocessor(), strip_accents_ascii)
441+
442+
430443
def test_hashing_vectorizer():
431444
v = HashingVectorizer()
432445
X = v.transform(ALL_FOOD_DOCS)

0 commit comments

Comments
 (0)
0