from __future__ import unicode_literals from spacy.en import English import pytest EN = English() @pytest.fixture def doc(): return EN('This is a sentence. This is another sentence. And a third.') def test_sent_spans(doc): sents = list(doc.sents) assert sents[0].start == 0 assert sents[0].end == 5 assert len(sents) == 3 assert sum(len(sent) for sent in sents) == len(doc)