spaCy/spacy/tests/regression/test_issue3521.py

# coding: utf8
from __future__ import unicode_literals

import pytest


@pytest.mark.parametrize("word", ["don't", "don’t", "I'd", "I’d"])
def test_issue3521(en_tokenizer, word):
    """Regression test for issue 3521: contracted forms count as stop words.

    Each parametrized ``word`` is a contraction written with either a
    straight or a curly apostrophe. The word is tokenized and the token at
    index 1 is checked for the ``is_stop`` flag.
    """
    tokens = en_tokenizer(word)
    # The token at index 1 is expected to be the abbreviated 'not' / 'would',
    # which should be a stop word just like its full form.
    contraction = tokens[1]
    assert contraction.is_stop