From 15479b3baea8d0f5cb58bf7d22321646ac4513bc Mon Sep 17 00:00:00 2001 From: ines Date: Tue, 26 Sep 2017 16:43:28 +0200 Subject: [PATCH] Add comment to like_num re: future work --- spacy/lang/nl/lex_attrs.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/spacy/lang/nl/lex_attrs.py b/spacy/lang/nl/lex_attrs.py index 4a9c0bdc3..08b1df3be 100644 --- a/spacy/lang/nl/lex_attrs.py +++ b/spacy/lang/nl/lex_attrs.py @@ -19,6 +19,10 @@ miljardste biljoenste biljardste triljoenste triljardste def like_num(text): + # This only does the most basic check for whether a token is a digit + # or matches one of the number words. In order to handle numbers like + # "drieëntwintig", more work is required. + # See this discussion: https://github.com/explosion/spaCy/pull/1177 text = text.replace(',', '').replace('.', '') if text.isdigit(): return True