from __future__ import unicode_literals
import pytest
import os


@pytest.fixture(scope='session')
def nlp():
    """Build the English pipeline once per test session.

    The ``SPACY_DATA`` environment variable, when set to a non-empty
    value, is passed as the ``path`` argument. Otherwise ``True`` is
    passed instead (presumably asking spaCy to use its default data
    location -- confirm against the spaCy version in use).
    """
    # Imported lazily so the import only happens when a test requests
    # this fixture.
    from spacy.en import English

    # An unset or empty variable is falsy, so ``or`` falls back to True.
    model_path = os.environ.get('SPACY_DATA') or True
    return English(path=model_path)


@pytest.fixture()
def doc(nlp):
    """Return the result of running ``nlp`` on a fixed two-sentence text.

    Each token of the text is looked up in ``nlp.vocab`` before the text
    is processed (presumably so the entries already exist in the
    vocabulary -- confirm against the spaCy version in use).
    """
    text = 'Hello, world. Here are two sentences.'
    tokens = ('Hello', ',', 'world', '.',
              'Here', 'are', 'two', 'sentences', '.')
    for token in tokens:
        # The lookup result is deliberately discarded; only the access
        # itself matters here.
        nlp.vocab[token]
    return nlp(text)