spaCy/spacy/tests/regression/test_issue3521.py

17 lines
313 B
Python
Raw Normal View History

2019-04-02 11:15:35 +00:00
import pytest
@pytest.mark.parametrize(
    "word",
    [
        u"don't",
        u"dont",
        u"I'd",
        u"Id",
    ],
)
def test_issue3521(en_tokenizer, word):
    """Regression test for issue 3521: contracted forms must be stop words.

    Tokenizes ``word`` and checks that the second token has ``is_stop`` set.

    en_tokenizer: tokenizer callable received as a test argument
        (presumably a pytest fixture defined outside this file).
    word: the contraction under test, supplied by ``parametrize``.
    """
    doc = en_tokenizer(word)
    # Fail with a readable message instead of an IndexError if the tokenizer
    # does not split the contraction into more than one token.
    assert len(doc) > 1, "expected %r to be split into several tokens" % word
    tok = doc[1]
    # 'not' and 'would' should be stopwords, also in their abbreviated forms
    assert tok.is_stop