Test lemma_ with unicode input

This commit is contained in:
Someon 2015-03-11 01:23:06 +02:00
parent 2e8d0e5d45
commit ec25976416

View File

@@ -0,0 +1,15 @@
# encoding=utf8
from __future__ import unicode_literals
from spacy.en import English
import pytest
@pytest.fixture
def tokens():
    """Return the result of running the English pipeline on two accented words.

    The input string holds two space-separated words, each containing one
    non-ASCII letter, so tests can check how such text is handled.
    """
    nlp = English()
    return nlp(u'ćode codé')
def test_unicode(tokens):
    """Check that ``lemma_`` of each accented word equals the word itself."""
    expected_lemmas = (u'ćode', u'codé')
    # Walk the positions in order so the first mismatch is reported first.
    for position, expected in enumerate(expected_lemmas):
        assert tokens[position].lemma_ == expected