From 47af3f676e54138bd83a971be0679f3cf93ff9a7 Mon Sep 17 00:00:00 2001
From: Adriane Boyd
Date: Wed, 28 Aug 2019 09:16:54 +0200
Subject: [PATCH] Single and paired orth variants for German

---
 spacy/lang/de/__init__.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/spacy/lang/de/__init__.py b/spacy/lang/de/__init__.py
index 1b5aee6a8..ae972072f 100644
--- a/spacy/lang/de/__init__.py
+++ b/spacy/lang/de/__init__.py
@@ -27,6 +27,10 @@ class GermanDefaults(Language.Defaults):
     stop_words = STOP_WORDS
     syntax_iterators = SYNTAX_ITERATORS
     resources = {"lemma_lookup": "lemma_lookup.json"}
+    single_orth_variants = [{"tags": ["$("], "variants": ["…", "..."]},
+                            {"tags": ["$("], "variants": ["-", "—", "–", "--", "---", "——"]}]
+    paired_orth_variants = [{"tags": ["$("], "variants": [("'", "'"), (",", "'"), ("‚", "‘")]},
+                            {"tags": ["$("], "variants": [("``", "''"), ('"', '"'), ("„", "“")]}]
 
 
 class German(Language):