mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-24 17:06:29 +03:00
Fixed tests for Swedish that were written in Danish. (#5395)
This commit is contained in:
parent
c045a9c7f6
commit
5e55bfa821
|
@ -47,15 +47,15 @@ def test_sv_tokenizer_handles_ambiguous_abbr(sv_tokenizer, text):
|
||||||
|
|
||||||
|
|
||||||
def test_sv_tokenizer_handles_exc_in_text(sv_tokenizer):
|
def test_sv_tokenizer_handles_exc_in_text(sv_tokenizer):
|
||||||
text = "Det er bl.a. ikke meningen"
|
text = "Det är bl.a. inte meningen"
|
||||||
tokens = sv_tokenizer(text)
|
tokens = sv_tokenizer(text)
|
||||||
assert len(tokens) == 5
|
assert len(tokens) == 5
|
||||||
assert tokens[2].text == "bl.a."
|
assert tokens[2].text == "bl.a."
|
||||||
|
|
||||||
|
|
||||||
def test_sv_tokenizer_handles_custom_base_exc(sv_tokenizer):
|
def test_sv_tokenizer_handles_custom_base_exc(sv_tokenizer):
|
||||||
text = "Her er noget du kan kigge i."
|
text = "Här är något du kan titta på."
|
||||||
tokens = sv_tokenizer(text)
|
tokens = sv_tokenizer(text)
|
||||||
assert len(tokens) == 8
|
assert len(tokens) == 8
|
||||||
assert tokens[6].text == "i"
|
assert tokens[6].text == "på"
|
||||||
assert tokens[7].text == "."
|
assert tokens[7].text == "."
|
||||||
|
|
Loading…
Reference in New Issue
Block a user