Fixed tests for Swedish that were written in Danish. (#5395)

This commit is contained in:
Samuel Rodríguez Medina 2020-05-05 14:06:27 +02:00 committed by GitHub
parent c045a9c7f6
commit 5e55bfa821
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 3 additions and 3 deletions

View File

@@ -47,15 +47,15 @@ def test_sv_tokenizer_handles_ambiguous_abbr(sv_tokenizer, text):
def test_sv_tokenizer_handles_exc_in_text(sv_tokenizer): def test_sv_tokenizer_handles_exc_in_text(sv_tokenizer):
text = "Det er bl.a. ikke meningen" text = "Det är bl.a. inte meningen"
tokens = sv_tokenizer(text) tokens = sv_tokenizer(text)
assert len(tokens) == 5 assert len(tokens) == 5
assert tokens[2].text == "bl.a." assert tokens[2].text == "bl.a."
def test_sv_tokenizer_handles_custom_base_exc(sv_tokenizer): def test_sv_tokenizer_handles_custom_base_exc(sv_tokenizer):
text = "Her er noget du kan kigge i." text = "Här är något du kan titta på."
tokens = sv_tokenizer(text) tokens = sv_tokenizer(text)
assert len(tokens) == 8 assert len(tokens) == 8
assert tokens[6].text == "i" assert tokens[6].text == "på"
assert tokens[7].text == "." assert tokens[7].text == "."