mirror of https://github.com/explosion/spaCy.git
enable tokenizer exceptions
This commit is contained in:
parent
ad56c9179a
commit
7aad6718bc
|
@ -1,4 +1,11 @@
|
|||
# coding: utf8
|
||||
from __future__ import unicode_literals
|
||||
|
||||
# Initial empty value; this name is rebound at the end of the module once the
# exception table has been built.
# NOTE(review): in a diff view this may be the removed line — confirm whether
# it still exists in the file.
TOKENIZER_EXCEPTIONS = {}
|
||||
from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS
|
||||
|
||||
# Build the tokenizer exception table: every string in FR_BASE_EXCEPTIONS,
# plus the abbreviation "etc.", maps to a one-element list holding a dict
# whose ORTH entry is the string itself.
# NOTE(review): ORTH is not imported in the visible part of this module —
# confirm it is brought into scope (presumably from spaCy's symbols module),
# otherwise this raises NameError at import time.
# NOTE(review): the `+ ["etc."]` concatenation assumes FR_BASE_EXCEPTIONS is a
# list — verify against _tokenizer_exceptions_list.
_exc = {orth: [{ORTH: orth}] for orth in FR_BASE_EXCEPTIONS + ["etc."]}

# Expose a shallow copy so that rebinding or mutating the private _exc dict
# does not alter the public table.
TOKENIZER_EXCEPTIONS = dict(_exc)
|
Loading…
Reference in New Issue