Enabling tests/lang/ru/test_lemmatizer.py, fixing a unicode issue (#3084)

## Description

See #3079. Here I'm merging into `develop` instead of `master`.

### Types of change

Bug fix.

## Checklist

- [x] I have submitted the spaCy Contributor Agreement.
- [x] I ran the tests, and all new and existing tests passed.
- [x] My changes don't require a change to the documentation, or if they do, I've added all required information.
2025-12-26 11:33:21 +03:00 · 2018-12-30 16:10:26 +05:00 · 2018-12-30 16:10:26 +05:00 · b665a32b95
commit b665a32b95
parent 9bc4cc1352
2 changed files with 4 additions and 2 deletions
--- a/spacy/lang/ru/lemmatizer.py
+++ b/spacy/lang/ru/lemmatizer.py
@@ -1,6 +1,9 @@
 # coding: utf8
+from __future__ import unicode_literals
+
 from ...symbols import ADJ, DET, NOUN, NUM, PRON, PROPN, PUNCT, VERB, POS
 from ...lemmatizer import Lemmatizer
+from ...compat import unicode_


 class RussianLemmatizer(Lemmatizer):
@@ -81,7 +84,7 @@ class RussianLemmatizer(Lemmatizer):

    @staticmethod
    def normalize_univ_pos(univ_pos):
-        if isinstance(univ_pos, str):
+        if isinstance(univ_pos, unicode_):
            return univ_pos.upper()

        symbols_to_str = {
--- a/spacy/tests/lang/ru/test_lemmatizer.py
+++ b/spacy/tests/lang/ru/test_lemmatizer.py
@@ -39,7 +39,6 @@ def test_ru_lemmatizer_noun_lemmas(ru_lemmatizer, text, lemmas):
    assert sorted(ru_lemmatizer.noun(text)) == lemmas


-@pytest.mark.models("ru")
@pytest.mark.parametrize(
    "text,pos,morphology,lemma",
    [