2014-12-19 19:51:25 +03:00
|
|
|
from __future__ import unicode_literals
|
2014-12-22 00:54:47 +03:00
|
|
|
from spacy.en import English
|
2014-12-19 19:51:25 +03:00
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
2014-12-22 00:54:47 +03:00
|
|
|
from spacy.en import English
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.fixture
def EN():
    """Build and return a new ``English`` instance for the requesting test."""
    nlp = English()
    return nlp
|
2014-12-22 00:54:47 +03:00
|
|
|
|
|
|
|
|
2014-12-19 19:51:25 +03:00
|
|
|
@pytest.fixture
def morph_exc():
    """Return a small morphological-exception table for the tagger.

    The table is keyed by tag name ('PRP$'), then by word form ('his'),
    and maps to the attributes to apply for that word.
    """
    # NOTE(review): 'L' presumably holds the lemma to assign -- confirm
    # against the tagger's load_morph_exceptions implementation.
    his_entry = {'L': '-PRP-', 'person': 3, 'case': 2}
    exceptions = {'PRP$': {'his': his_entry}}
    return exceptions
|
|
|
|
|
2014-12-22 00:54:47 +03:00
|
|
|
def test_load_exc(EN, morph_exc):
    """Load the exception table into the tagger and check its effect on 'his'.

    After loading, 'his' in a tagged sentence must carry the 'PRP$' tag
    and the lemma '-PRP-'.
    """
    EN.tagger.load_morph_exceptions(morph_exc)

    doc = EN('I like his style.', tag=True)
    # Index 2 is the third token of the sentence, expected to be "his".
    pronoun = doc[2]

    tag_name = EN.tagger.tag_names[pronoun.fine_pos]
    assert tag_name == 'PRP$'
    assert pronoun.lemma == '-PRP-'
|