spaCy/spacy/tests/parser/test_space_attachment.py

24 lines
550 B
Python
Raw Normal View History

from __future__ import unicode_literals
import pytest
import numpy
from spacy.attrs import HEAD
@pytest.mark.models
def test_space_attachment(EN):
    """Check that no single-token sentence consists of a whitespace token.

    Runs the ``EN`` pipeline fixture over a two-line text and, for every
    sentence span that holds exactly one token, asserts that the token is
    not flagged ``is_space``.
    """
    doc = EN('This is a test.\nTo ensure spaces are attached well.')
    for span in doc.sents:
        # Only one-token sentences are of interest here; skip the rest.
        if len(span) != 1:
            continue
        assert not span[-1].is_space
def test_sentence_space(EN):
    """Check that the sample text is segmented into exactly two sentences.

    The text is one full sentence followed by a second one that ends in an
    ellipsis.
    """
    # NOTE(review): unlike test_space_attachment in this file, this test
    # carries no @pytest.mark.models marker even though it also relies on
    # the EN fixture and doc.sents -- confirm whether that is intentional.
    text = (
        "I look forward to using Thingamajig. I've been told it will "
        "make my life easier..."
    )
    sentences = list(EN(text).sents)
    assert len(sentences) == 2