spaCy/tests/doc/test_morphanalysis.py

34 lines
813 B
Python
Raw Normal View History

2019-03-08 02:10:07 +03:00
# coding: utf-8
from __future__ import unicode_literals
import pytest
2019-03-08 15:28:53 +03:00
2019-03-08 02:10:07 +03:00
@pytest.fixture
def i_has(en_tokenizer):
    """Return the doc for "I has" with tags set on its first two tokens.

    The text is tokenized with the ``en_tokenizer`` fixture; token 0 is
    tagged "PRP" and token 1 is tagged "VBZ" before the doc is returned.
    """
    tagged_doc = en_tokenizer("I has")
    # Assign the tags by position, in order, exactly one per token index.
    for position, tag in enumerate(("PRP", "VBZ")):
        tagged_doc[position].tag_ = tag
    return tagged_doc
2019-03-08 15:28:53 +03:00
2019-03-08 02:10:07 +03:00
def test_token_morph_id(i_has):
    """Both tokens expose a non-zero ``morph.id`` and the two ids differ."""
    pronoun_id = i_has[0].morph.id
    assert pronoun_id
    verb_id = i_has[1].morph.id
    assert verb_id != 0
    assert pronoun_id != verb_id
2019-03-08 15:28:53 +03:00
2019-03-08 02:10:07 +03:00
def test_morph_props(i_has):
    """Check the ``pron_type`` / ``pron_type_`` properties on both tokens.

    Token 0 must report "PronType_prs" both as the id stored in the
    doc's vocab string store and as the string itself; token 1 must
    report 0 for ``pron_type``.
    """
    pronoun_morph = i_has[0].morph
    prs_id = i_has.vocab.strings["PronType_prs"]
    assert pronoun_morph.pron_type == prs_id
    assert pronoun_morph.pron_type_ == "PronType_prs"
    verb_morph = i_has[1].morph
    assert verb_morph.pron_type == 0
def test_morph_iter(i_has):
    """Iterating a token's ``morph`` yields its feature names as strings."""
    pronoun_features = list(i_has[0].morph)
    assert pronoun_features == ["PronType_prs"]
    verb_features = list(i_has[1].morph)
    assert verb_features == ["Number_sing", "Person_three", "VerbForm_fin"]
2019-03-08 03:38:54 +03:00
def test_morph_get(i_has):
    """``morph.get("pron_type")`` on token 0 returns "PronType_prs"."""
    pron_type = i_has[0].morph.get("pron_type")
    assert pron_type == "PronType_prs"