From 56e2219b658993ea90c84c7094bec9d8593fd76f Mon Sep 17 00:00:00 2001 From: Magnus Burton Date: Fri, 30 Dec 2016 21:17:34 +0100 Subject: [PATCH] Added Swedish city abbreviations --- spacy/sv/tokenizer_exceptions.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/spacy/sv/tokenizer_exceptions.py b/spacy/sv/tokenizer_exceptions.py index b2a85eec9..d8d4e8823 100644 --- a/spacy/sv/tokenizer_exceptions.py +++ b/spacy/sv/tokenizer_exceptions.py @@ -62,6 +62,12 @@ TOKENIZER_EXCEPTIONS = { ], "sön.": [ {ORTH: "sön.", LEMMA: "söndag"} + ], + "sthlm": [ + {ORTH: "sthlm", LEMMA: "Stockholm"} + ], + "gbg": [ + {ORTH: "gbg", LEMMA: "Göteborg"} ] }