spaCy/spacy/tests/test_underscore.py

96 lines
3.1 KiB
Python
Raw Normal View History

# coding: utf-8
from __future__ import unicode_literals
import pytest
2017-10-07 16:56:19 +00:00
from mock import Mock
from ..vocab import Vocab
from ..tokens.doc import Doc
2017-10-07 16:56:19 +00:00
from ..tokens.underscore import Underscore
def test_create_doc_underscore():
    """An Underscore created for a doc keeps that doc and has no offsets."""
    mock_doc = Mock()
    # The mock is its own `.doc`, mirroring what the original test set up.
    mock_doc.doc = mock_doc
    underscore = Underscore(Underscore.doc_extensions, mock_doc)
    assert underscore._doc is mock_doc
    # No start/end were passed, so both are expected to be None.
    assert underscore._start is None
    assert underscore._end is None
2017-10-11 11:34:11 +00:00
2017-10-07 16:56:19 +00:00
def test_doc_underscore_getattr_setattr():
    """Reading `doc._.hello` yields the registered value; assignment updates it."""
    mock_doc = Mock()
    mock_doc.doc = mock_doc
    mock_doc.user_data = {}
    # Register 'hello' with False in the first slot; the assertion below
    # checks that this is the value read back before any assignment.
    hello_extension = (False, None, None, None)
    Underscore.doc_extensions['hello'] = hello_extension
    mock_doc._ = Underscore(Underscore.doc_extensions, mock_doc)
    assert mock_doc._.hello == False
    mock_doc._.hello = True
    assert mock_doc._.hello == True
2017-10-11 11:34:11 +00:00
2017-10-07 16:56:19 +00:00
def test_create_span_underscore():
    """An Underscore created for a span keeps the span's doc, start and end."""
    mock_span = Mock(doc=Mock(), start=0, end=2)
    span_start = mock_span.start
    span_end = mock_span.end
    underscore = Underscore(Underscore.span_extensions, mock_span,
                            start=span_start, end=span_end)
    assert underscore._doc is mock_span.doc
    assert underscore._start is mock_span.start
    assert underscore._end is mock_span.end
2017-10-11 11:34:11 +00:00
2017-10-07 16:56:19 +00:00
def test_span_underscore_getter_setter():
    """A span extension with a getter and a setter reads and writes via them."""

    def read_start(s):
        # Getter: pair the object's current start with a fixed marker.
        return (s.start, 'hi')

    def write_start(s, value):
        # Setter: store the assigned value as the object's start.
        setattr(s, 'start', value)

    mock_span = Mock(doc=Mock(), start=0, end=2)
    Underscore.span_extensions['hello'] = (None, None, read_start, write_start)
    mock_span._ = Underscore(Underscore.span_extensions, mock_span,
                             start=mock_span.start, end=mock_span.end)

    assert mock_span._.hello == (0, 'hi')
    # Assigning goes through the setter, which changes what the getter sees.
    mock_span._.hello = 1
    assert mock_span._.hello == (1, 'hi')
def test_token_underscore_method():
    """A token extension registered as a method can be called via `token._`."""

    def say_cheese(token):
        return 'cheese'

    mock_token = Mock(doc=Mock(), idx=7, say_cheese=say_cheese)
    # Only the second slot (the method) is populated for this extension.
    hello_extension = (None, mock_token.say_cheese, None, None)
    Underscore.token_extensions['hello'] = hello_extension
    mock_token._ = Underscore(Underscore.token_extensions, mock_token,
                              start=mock_token.idx)
    assert mock_token._.hello() == 'cheese'
@pytest.mark.parametrize('obj', [
    Doc(Vocab(), words=['hello', 'world']),
    Doc(Vocab(), words=['hello', 'world'])[1],
    Doc(Vocab(), words=['hello', 'world'])[0:2]])
def test_underscore_raises_for_dup(obj):
    """Registering the same extension name twice raises ValueError.

    Runs once each for a Doc, an item indexed out of a Doc, and a slice of
    a Doc.
    """
    register = obj.set_extension
    register('test', default=None)
    # The second registration of 'test' (without force) must be rejected.
    with pytest.raises(ValueError):
        register('test', default=None)
@pytest.mark.parametrize('invalid_kwargs', [
    {'getter': None, 'setter': lambda: None},
    {'default': None, 'method': lambda: None, 'getter': lambda: None},
    {'setter': lambda: None},
    {'default': None, 'method': lambda: None},
    {'getter': True}])
def test_underscore_raises_for_invalid(invalid_kwargs):
    """Each invalid keyword combination makes `set_extension` raise ValueError.

    `force=True` is passed so the call is not rejected merely because the
    'test' extension already exists; the ValueError must come from the
    keyword combination itself.
    """
    # Build a fresh dict instead of writing 'force' into the parametrized
    # one: pytest hands parameter values to the test without copying them,
    # so an in-place change would leak into the shared parameter data.
    kwargs = dict(invalid_kwargs, force=True)
    doc = Doc(Vocab(), words=['hello', 'world'])
    with pytest.raises(ValueError):
        doc.set_extension('test', **kwargs)
@pytest.mark.parametrize('valid_kwargs', [
    {'getter': lambda: None},
    {'getter': lambda: None, 'setter': lambda: None},
    {'default': 'hello'},
    {'default': None},
    {'method': lambda: None}])
def test_underscore_accepts_valid(valid_kwargs):
    """Each valid keyword combination is accepted by `set_extension`.

    The test passes when the call completes without raising. `force=True`
    is passed so an already-registered 'test' extension is not an obstacle.
    """
    # Build a fresh dict instead of writing 'force' into the parametrized
    # one: pytest hands parameter values to the test without copying them,
    # so an in-place change would leak into the shared parameter data.
    kwargs = dict(valid_kwargs, force=True)
    doc = Doc(Vocab(), words=['hello', 'world'])
    doc.set_extension('test', **kwargs)