* Add test for reading in POS tags

This commit is contained in:
Matthew Honnibal 2014-10-22 10:18:43 +11:00
parent 224bdae996
commit 077885637d
1 changed files with 15 additions and 0 deletions

15
tests/test_read_pos.py Normal file
View File

@ -0,0 +1,15 @@
import py.test
from spacy.pos_util import realign_tagged
from spacy.pos_util import _parse_line
def test_realign():
rules = ["<SEP>,", "ca<SEP>n't", "``<SEP>"]
tagged = "``/`` I/PRP ca/MD n't/RB"
assert realign_tagged(rules, tagged) == "``<SEP>I/``_PRP ca<SEP>n't/MD_RB"
def test_parse_line():
line = "Pierre/NNP Vinken,/NNP_, isn't/VBZ_RB 61/CD years/NNS old./RB_.\n"
tokens, tags = _parse_line(line, '/')
assert len(tokens) == len(tags)
assert len(tokens) == 9