diff --git a/spacy/bn/tokenizer_exceptions.py b/spacy/bn/tokenizer_exceptions.py index 169608d0b..ac8a95b3f 100644 --- a/spacy/bn/tokenizer_exceptions.py +++ b/spacy/bn/tokenizer_exceptions.py @@ -35,6 +35,9 @@ ABBREVIATIONS = { {ORTH: "সে.মি", LEMMA: "সেন্টিমিটার"}, {ORTH: "সে.মি.", LEMMA: "সেন্টিমিটার"}, ], + "মি.লি.": [ + {ORTH: "মি.লি.", LEMMA: "মিলিলিটার"}, + ] } TOKENIZER_EXCEPTIONS.update(ABBREVIATIONS)