# coding: utf-8 from __future__ import unicode_literals import pytest @pytest.mark.parametrize( "text,norms", [("пн.", ["понедельник"]), ("пт.", ["пятница"]), ("дек.", ["декабрь"])], ) def test_ru_tokenizer_abbrev_exceptions(ru_tokenizer, text, norms): tokens = ru_tokenizer(text) assert len(tokens) == 1 assert [token.norm_ for token in tokens] == norms