spaCy/spacy/tests/regression/test_issue587.py

21 lines
721 B
Python
Raw Normal View History

2017-01-10 18:24:10 +00:00
# coding: utf-8
from __future__ import unicode_literals
from ...matcher import Matcher
from ...attrs import IS_PUNCT, ORTH
import pytest
2017-01-10 18:24:10 +00:00
@pytest.mark.models
def test_issue587(EN):
    """Regression test for issue 587: Matcher must not segfault.

    Patterns are registered one at a time and the matcher is re-run on a
    freshly tokenized copy of the same text after each registration. The
    test passes if none of these calls crash; match results are not checked.
    """
    text = '''a b; c'''

    # (entity key, token pattern) pairs, in the exact order they are added.
    # The later patterns extend the first one's 'a', 'b' prefix.
    keyed_patterns = [
        ('1', [{ORTH: 'a'}, {ORTH: 'b'}]),
        ('2', [{ORTH: 'a'}, {ORTH: 'b'}, {IS_PUNCT: True}, {ORTH: 'c'}]),
        ('3', [{ORTH: 'a'}, {ORTH: 'b'}, {IS_PUNCT: True}, {ORTH: 'd'}]),
    ]

    matcher = Matcher(EN.vocab)
    for key, pattern in keyed_patterns:
        matcher.add(entity_key=key, label='TEST', attrs={}, specs=[pattern])
        # Run after every add: the test exercises the matcher at each
        # intermediate state, not only once all patterns are registered.
        matcher(EN(text))