diff --git a/spacy/lang/id/tokenizer_exceptions.py b/spacy/lang/id/tokenizer_exceptions.py
index 339f5a54c..915197cd8 100644
--- a/spacy/lang/id/tokenizer_exceptions.py
+++ b/spacy/lang/id/tokenizer_exceptions.py
@@ -1,4 +1,14 @@
 # coding: utf8
 from __future__ import unicode_literals
 
-TOKENIZER_EXCEPTIONS = {}
\ No newline at end of file
+from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS
+from ...symbols import ORTH
+
+# Each exception string maps to a one-element list holding {ORTH: <string>};
+# presumably this keeps the string as a single token -- confirm with tokenizer.
+_exc = {}
+
+for orth in FR_BASE_EXCEPTIONS + ["etc."]:
+    _exc[orth] = [{ORTH: orth}]
+
+TOKENIZER_EXCEPTIONS = dict(_exc)
\ No newline at end of file