mirror of https://github.com/explosion/spaCy.git
Allow entity types with dashes (resolves #1967)
This commit is contained in:
parent
9615ed5ed7
commit
3eb67bbe4b
|
@ -84,9 +84,7 @@ cdef class BiluoPushDown(TransitionSystem):
|
||||||
for (ids, words, tags, heads, labels, biluo), _ in sents:
|
for (ids, words, tags, heads, labels, biluo), _ in sents:
|
||||||
for i, ner_tag in enumerate(biluo):
|
for i, ner_tag in enumerate(biluo):
|
||||||
if ner_tag != 'O' and ner_tag != '-':
|
if ner_tag != 'O' and ner_tag != '-':
|
||||||
if ner_tag.count('-') != 1:
|
_, label = ner_tag.split('-', 1)
|
||||||
raise ValueError(ner_tag)
|
|
||||||
_, label = ner_tag.split('-')
|
|
||||||
if label not in seen_entities:
|
if label not in seen_entities:
|
||||||
seen_entities.add(label)
|
seen_entities.add(label)
|
||||||
for move_str in ('B', 'I', 'L', 'U'):
|
for move_str in ('B', 'I', 'L', 'U'):
|
||||||
|
|
|
@ -0,0 +1,15 @@
|
||||||
|
# coding: utf8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from ...pipeline import EntityRecognizer
|
||||||
|
from ...vocab import Vocab
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.parametrize('label', ['U-JOB-NAME'])
def test_issue1967(label):
    """Regression test for issue #1967: entity types that contain dashes.

    Builds a single-token gold parse whose BILUO tag is ``label`` and hands
    it to the NER transition system's ``get_actions``. There is no explicit
    assertion; the test passes as long as that call does not raise.
    """
    # Annotation fields for a one-token sentence, in the order the
    # transition system unpacks them: ids, words, tags, heads, deps, biluo.
    ids, words, tags = [0], ['word'], ['tag']
    heads, deps, biluo_tags = [0], ['dep'], [label]
    annotations = (ids, words, tags, heads, deps, biluo_tags)

    # Each gold parse pairs a leading value (None here) with a list of
    # (annotations, extra) sentence tuples; the extra slot is also None.
    sentences = [(annotations, None)]
    gold_parses = [(None, sentences)]

    recognizer = EntityRecognizer(Vocab())
    recognizer.moves.get_actions(gold_parses=gold_parses)
|
Loading…
Reference in New Issue