mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-24 17:06:29 +03:00
Add test for tokenization of 'i.' for Danish.
This commit is contained in:
parent
ac8116510d
commit
8dc265ac0c
|
@ -13,3 +13,10 @@ def test_da_tokenizer_handles_exc_in_text(da_tokenizer):
|
|||
tokens = da_tokenizer(text)
|
||||
assert len(tokens) == 5
|
||||
assert tokens[2].text == "bl.a."
|
||||
|
||||
def test_da_tokenizer_handles_custom_base_exc(da_tokenizer):
    """Check that a sentence-final "i." is split into "i" and "."."""
    sentence = "Her er noget du kan kigge i."
    doc = da_tokenizer(sentence)
    # Seven words plus the sentence-final period.
    assert len(doc) == 8
    final_word = doc[6]
    assert final_word.text == "i"
    final_punct = doc[7]
    assert final_punct.text == "."
|
||||
|
|
Loading…
Reference in New Issue
Block a user