mirror of https://github.com/explosion/spaCy.git
enable tokenizer exceptions
This commit is contained in:
parent
ad56c9179a
commit
7aad6718bc
|
@ -1,4 +1,11 @@
|
||||||
# coding: utf8
|
# coding: utf8
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
TOKENIZER_EXCEPTIONS = {}
|
from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS
|
||||||
|
|
||||||
|
_exc = {}
|
||||||
|
|
||||||
|
for orth in FR_BASE_EXCEPTIONS + ["etc."]:
|
||||||
|
_exc[orth] = [{ORTH: orth}]
|
||||||
|
|
||||||
|
TOKENIZER_EXCEPTIONS = dict(_exc)
|
Loading…
Reference in New Issue