Add test for vocab serialization

2017-05-29 01:08:10 +02:00 · 2017-05-29 01:08:10 +02:00 · 7b1ddcc04d
parent 00b2094dc3
commit 7b1ddcc04d
1 changed files with 10 additions and 0 deletions
--- a/spacy/tests/serialize/test_serialization.py
+++ b/spacy/tests/serialize/test_serialization.py
@@ -3,6 +3,7 @@ from __future__ import unicode_literals

 from ..util import get_doc, assert_docs_equal
 from ...tokens import Doc
+from ...vocab import Vocab

 import pytest

@@ -22,6 +23,15 @@ def test_serialize_empty_doc(en_vocab):
    for token1, token2 in zip(doc, doc2):
        assert token1.text == token2.text

+
+@pytest.mark.xfail
+@pytest.mark.parametrize('text', ['rat'])
+def test_serialize_vocab(en_vocab, text):
+    text_hash = en_vocab.strings.add(text)
+    vocab_bytes = en_vocab.to_bytes()
+    new_vocab = Vocab().from_bytes(vocab_bytes)
+    assert new_vocab.strings(text_hash) == text
+
 #
 #@pytest.mark.parametrize('text', [TEXT])
 #def test_serialize_tokens(en_vocab, text):