* Add test for hyphenation problem in Issue #302

This commit is contained in:
Matthew Honnibal 2016-03-29 14:27:13 +11:00
parent d249e2f7f3
commit 9c73983bdd
1 changed file with 6 additions and 0 deletions

View File

@@ -32,3 +32,9 @@ def test_email(en_tokenizer):
assert len(tokens) == 1
def test_double_hyphen(en_tokenizer):
    """Regression test for the hyphenation problem reported in Issue #302.

    Tokenizes a sentence containing double hyphens and checks that the
    first four tokens have the expected text, with ``--`` as its own token.
    """
    doc = en_tokenizer(u'No decent--let alone well-bred--people.')
    # Only the leading tokens are pinned; the rest of the sentence is not
    # checked by this test.
    expected_prefix = (u'No', u'decent', u'--', u'let')
    for position, expected_text in enumerate(expected_prefix):
        assert doc[position].text == expected_text