2017-04-24 08:09:01 +00:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
2017-04-23 15:57:01 +00:00
|
|
|
import pytest
|
|
|
|
|
|
|
|
|
2017-05-29 20:14:31 +00:00
|
|
|
@pytest.mark.models('en')
def test_issue955(EN):
    """Regression test for issue 955: noun chunks must never be nested.

    The ``EN`` argument is called on a fixed sentence, and every token of
    every noun chunk in the result is visited. The test fails as soon as a
    token is encountered a second time, which would mean two chunks overlap.
    """
    text = ('Does flight number three fifty-four require a connecting flight'
            ' to get to Boston?')
    parsed = EN(text)
    visited = set()
    for chunk in parsed.noun_chunks:
        for token in chunk:
            # Pair the token index with its text so a failure is readable.
            ident = (token.i, token.text)
            # A repeated pair means this token belongs to more than one chunk.
            assert ident not in visited
            visited.add(ident)
|