|
class RegexMerger(object):
|
|
def __init__(self, regexes):
|
|
self.regexes = regexes
|
|
|
|
def __call__(self, tokens):
|
|
for tag, entity_type, regex in self.regexes:
|
|
for m in regex.finditer(unicode(tokens)):
|
|
tokens.merge(m.start(), m.end(), tag, m.group(), entity_type)
|