mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 18:06:29 +03:00
9 lines
252 B
Python
9 lines
252 B
Python
|
import pytest
|
||
|
|
||
|
|
||
|
def test_bg_tokenizer_handles_final_diacritics(bg_tokenizer):
    """Check tokenization of a word that ends in a diacritic before a period.

    The sample text repeats the same two-word sentence twice. Only the first
    sentence is inspected: the token at index 1 must be the accented word with
    its final diacritic intact, and the token at index 2 must be the period
    on its own.
    """
    doc = bg_tokenizer("Ня̀маше яйца̀. Ня̀маше яйца̀.")
    # (token index, expected text) pairs, checked in order.
    expected_by_index = (
        (1, "яйца̀"),
        (2, "."),
    )
    for index, expected in expected_by_index:
        assert doc[index].text == expected
|