spaCy/spacy/tests/morphology/test_morph_features.py

48 lines
1.3 KiB
Python
Raw Normal View History

2018-09-25 18:38:08 +00:00
import pytest
2019-03-08 12:28:53 +00:00
from spacy.morphology import Morphology
from spacy.strings import StringStore, get_string_id
from spacy.lemmatizer import Lemmatizer
from spacy.lookups import Lookups
2018-09-25 18:38:08 +00:00
@pytest.fixture
def morphology():
lemmatizer = Lemmatizer(Lookups())
return Morphology(StringStore(), {}, lemmatizer)
2018-09-25 18:38:08 +00:00
2019-03-08 12:28:53 +00:00
2018-09-25 18:38:08 +00:00
def test_init(morphology):
pass
2019-03-08 12:28:53 +00:00
2018-09-25 19:07:48 +00:00
def test_add_morphology_with_string_names(morphology):
morphology.add({"Case_gen", "Number_sing"})
2018-09-25 18:38:08 +00:00
2019-03-08 12:28:53 +00:00
2018-09-25 19:07:48 +00:00
def test_add_morphology_with_int_ids(morphology):
2019-03-07 16:14:57 +00:00
morphology.add({get_string_id("Case_gen"), get_string_id("Number_sing")})
2018-09-25 18:38:08 +00:00
2019-03-08 12:28:53 +00:00
2018-09-25 19:07:48 +00:00
def test_add_morphology_with_mix_strings_and_ints(morphology):
2019-03-08 12:28:53 +00:00
morphology.add({get_string_id("PunctSide_ini"), "VerbType_aux"})
2018-09-25 18:38:08 +00:00
2018-09-25 19:07:48 +00:00
def test_morphology_tags_hash_distinctly(morphology):
2019-03-08 12:28:53 +00:00
tag1 = morphology.add({"PunctSide_ini", "VerbType_aux"})
tag2 = morphology.add({"Case_gen", "Number_sing"})
2018-09-25 19:07:48 +00:00
assert tag1 != tag2
2019-03-08 12:28:53 +00:00
2018-09-25 19:07:48 +00:00
def test_morphology_tags_hash_independent_of_order(morphology):
2019-03-08 12:28:53 +00:00
tag1 = morphology.add({"Case_gen", "Number_sing"})
tag2 = morphology.add({"Number_sing", "Case_gen"})
2018-09-25 19:07:48 +00:00
assert tag1 == tag2
2019-03-08 12:28:53 +00:00
2018-09-25 19:07:48 +00:00
def test_update_morphology_tag(morphology):
tag1 = morphology.add({"Case_gen"})
tag2 = morphology.update(tag1, {"Number_sing"})
assert tag1 != tag2
2019-03-08 12:28:53 +00:00
tag3 = morphology.add({"Number_sing", "Case_gen"})
2018-09-25 19:07:48 +00:00
assert tag2 == tag3