2018-04-03 16:30:17 +00:00
|
|
|
# coding: utf-8
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import pytest
|
2017-10-07 16:56:19 +00:00
|
|
|
from mock import Mock
|
2018-07-24 21:38:44 +00:00
|
|
|
from spacy.tokens import Doc, Span, Token
|
|
|
|
from spacy.tokens.underscore import Underscore
|
2017-10-07 16:56:19 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_create_doc_underscore():
|
|
|
|
doc = Mock()
|
|
|
|
doc.doc = doc
|
|
|
|
uscore = Underscore(Underscore.doc_extensions, doc)
|
|
|
|
assert uscore._doc is doc
|
|
|
|
assert uscore._start is None
|
|
|
|
assert uscore._end is None
|
|
|
|
|
2017-10-11 11:34:11 +00:00
|
|
|
|
2017-10-07 16:56:19 +00:00
|
|
|
def test_doc_underscore_getattr_setattr():
|
|
|
|
doc = Mock()
|
|
|
|
doc.doc = doc
|
|
|
|
doc.user_data = {}
|
2018-11-27 00:09:36 +00:00
|
|
|
Underscore.doc_extensions["hello"] = (False, None, None, None)
|
2017-10-07 16:56:19 +00:00
|
|
|
doc._ = Underscore(Underscore.doc_extensions, doc)
|
2018-11-30 16:43:08 +00:00
|
|
|
assert doc._.hello is False
|
2017-10-07 16:56:19 +00:00
|
|
|
doc._.hello = True
|
2018-11-30 16:43:08 +00:00
|
|
|
assert doc._.hello is True
|
2017-10-07 16:56:19 +00:00
|
|
|
|
2017-10-11 11:34:11 +00:00
|
|
|
|
2017-10-07 16:56:19 +00:00
|
|
|
def test_create_span_underscore():
|
|
|
|
span = Mock(doc=Mock(), start=0, end=2)
|
2018-11-27 00:09:36 +00:00
|
|
|
uscore = Underscore(
|
|
|
|
Underscore.span_extensions, span, start=span.start, end=span.end
|
|
|
|
)
|
2017-10-07 16:56:19 +00:00
|
|
|
assert uscore._doc is span.doc
|
|
|
|
assert uscore._start is span.start
|
|
|
|
assert uscore._end is span.end
|
|
|
|
|
2017-10-11 11:34:11 +00:00
|
|
|
|
2017-10-07 16:56:19 +00:00
|
|
|
def test_span_underscore_getter_setter():
|
|
|
|
span = Mock(doc=Mock(), start=0, end=2)
|
2018-11-27 00:09:36 +00:00
|
|
|
Underscore.span_extensions["hello"] = (
|
|
|
|
None,
|
|
|
|
None,
|
|
|
|
lambda s: (s.start, "hi"),
|
|
|
|
lambda s, value: setattr(s, "start", value),
|
|
|
|
)
|
|
|
|
span._ = Underscore(
|
|
|
|
Underscore.span_extensions, span, start=span.start, end=span.end
|
|
|
|
)
|
|
|
|
|
|
|
|
assert span._.hello == (0, "hi")
|
2017-10-07 16:56:19 +00:00
|
|
|
span._.hello = 1
|
2018-11-27 00:09:36 +00:00
|
|
|
assert span._.hello == (1, "hi")
|
2017-10-07 16:56:19 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_token_underscore_method():
|
2018-11-27 00:09:36 +00:00
|
|
|
token = Mock(doc=Mock(), idx=7, say_cheese=lambda token: "cheese")
|
|
|
|
Underscore.token_extensions["hello"] = (None, token.say_cheese, None, None)
|
2017-10-07 16:56:19 +00:00
|
|
|
token._ = Underscore(Underscore.token_extensions, token, start=token.idx)
|
2018-11-27 00:09:36 +00:00
|
|
|
assert token._.hello() == "cheese"
|
2018-04-03 16:30:17 +00:00
|
|
|
|
|
|
|
|
2018-11-27 00:09:36 +00:00
|
|
|
@pytest.mark.parametrize("obj", [Doc, Span, Token])
|
2018-04-28 21:33:09 +00:00
|
|
|
def test_doc_underscore_remove_extension(obj):
|
2018-11-27 00:09:36 +00:00
|
|
|
ext_name = "to_be_removed"
|
2018-04-28 21:33:09 +00:00
|
|
|
obj.set_extension(ext_name, default=False)
|
|
|
|
assert obj.has_extension(ext_name)
|
|
|
|
obj.remove_extension(ext_name)
|
|
|
|
assert not obj.has_extension(ext_name)
|
|
|
|
|
|
|
|
|
2018-11-27 00:09:36 +00:00
|
|
|
@pytest.mark.parametrize("obj", [Doc, Span, Token])
|
2018-04-03 16:30:17 +00:00
|
|
|
def test_underscore_raises_for_dup(obj):
|
2018-11-27 00:09:36 +00:00
|
|
|
obj.set_extension("test", default=None)
|
2018-04-03 16:30:17 +00:00
|
|
|
with pytest.raises(ValueError):
|
2018-11-27 00:09:36 +00:00
|
|
|
obj.set_extension("test", default=None)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
|
|
"invalid_kwargs",
|
|
|
|
[
|
|
|
|
{"getter": None, "setter": lambda: None},
|
|
|
|
{"default": None, "method": lambda: None, "getter": lambda: None},
|
|
|
|
{"setter": lambda: None},
|
|
|
|
{"default": None, "method": lambda: None},
|
|
|
|
{"getter": True},
|
|
|
|
],
|
|
|
|
)
|
2018-04-03 16:30:17 +00:00
|
|
|
def test_underscore_raises_for_invalid(invalid_kwargs):
|
2018-11-27 00:09:36 +00:00
|
|
|
invalid_kwargs["force"] = True
|
2018-04-03 16:30:17 +00:00
|
|
|
with pytest.raises(ValueError):
|
2018-11-27 00:09:36 +00:00
|
|
|
Doc.set_extension("test", **invalid_kwargs)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
|
|
"valid_kwargs",
|
|
|
|
[
|
|
|
|
{"getter": lambda: None},
|
|
|
|
{"getter": lambda: None, "setter": lambda: None},
|
|
|
|
{"default": "hello"},
|
|
|
|
{"default": None},
|
|
|
|
{"method": lambda: None},
|
|
|
|
],
|
|
|
|
)
|
2018-04-03 16:30:17 +00:00
|
|
|
def test_underscore_accepts_valid(valid_kwargs):
|
2018-11-27 00:09:36 +00:00
|
|
|
valid_kwargs["force"] = True
|
|
|
|
Doc.set_extension("test", **valid_kwargs)
|