mirror of https://github.com/explosion/spaCy.git
15 lines
400 B
Python
15 lines
400 B
Python
# coding: utf-8
|
|
from __future__ import unicode_literals
|
|
|
|
from ..util import get_doc
|
|
|
|
|
|
def test_sbd_empty_string(en_tokenizer):
    """Regression test for Issue #309: sentence boundary detection on blank text.

    The issue title speaks of an "empty string", but the input exercised
    here is a single space character. The tokenizer output is rebuilt into
    a doc through ``get_doc`` with ``heads=[0]`` and ``deps=['ROOT']``, and
    the test then checks that the doc holds exactly one token and that
    iterating ``doc.sents`` yields exactly one sentence.
    """
    tokenized = en_tokenizer(" ")
    words = [token.text for token in tokenized]
    doc = get_doc(tokenized.vocab, words, heads=[0], deps=['ROOT'])
    # Flag the doc as parsed before touching ``doc.sents``.
    # NOTE(review): presumably sentence iteration requires this flag --
    # confirm against the Doc API for the spaCy version under test.
    doc.is_parsed = True

    # The single-space input is expected to come through as one token.
    assert len(doc) == 1

    # Materialise the sentence iterator so its length can be checked.
    sentences = list(doc.sents)
    assert len(sentences) == 1
|