spaCy/tests/test_wiki_sun.py
2014-08-30 20:36:06 +02:00

24 lines
385 B
Python

from __future__ import unicode_literals
from spacy.en import EN
from spacy.util import utf8open
import pytest
import os
from os import path
HERE = path.dirname(__file__)
@pytest.fixture
def sun_txt():
    """Return the entire contents of ``sun.txt``, read via ``utf8open``.

    The file is looked up in the directory that contains this test module.
    """
    loc = path.join(HERE, 'sun.txt')
    # Close the handle deterministically instead of leaving it to the
    # garbage collector.
    with utf8open(loc) as file_:
        return file_.read()
def test_tokenize(sun_txt):
    """Smoke test: ``EN.tokenize`` runs over the whole ``sun.txt`` text.

    The test passes as long as the fixture text is non-empty and the
    tokenize call does not raise.
    """
    # Guard against an empty fixture, which would make the call below trivial.
    assert sun_txt, 'sun.txt fixture is empty'
    # The result is intentionally not inspected; only "does not raise" is
    # checked here.
    EN.tokenize(sun_txt)