spaCy/spacy/lang/it/tokenizer_exceptions.py

8 lines
167 B
Python
Raw Normal View History

# coding: utf8
from __future__ import unicode_literals
from ...symbols import ORTH, LEMMA
2019-08-20 15:36:34 +00:00
# Special-case table: each key is a surface string, and its value is the list
# of per-token attribute dicts that string should be analysed as.
_exc = {
    # "po'" is described by one token whose text (ORTH) is "po'" and whose
    # lemma (LEMMA) is "poco".
    "po'": [
        {ORTH: "po'", LEMMA: "poco"},
    ],
}

# Public name for the table; it refers to the same dict object as `_exc`.
TOKENIZER_EXCEPTIONS = _exc