# spaCy/spacy/tests/regression/test_issue995.py
# 2017-07-22 15:42:38 +02:00
#
# 22 lines
# 558 B
# Python

from __future__ import unicode_literals
import pytest
from ... import load as load_spacy
@pytest.fixture
def doc():
    """Return the example question parsed by the 'en' pipeline.

    The pipeline is obtained through ``load_spacy('en')`` and applied to the
    sentence below; the resulting object is handed to the test.
    """
    sentence = ('Does flight number three fifty-four require a connecting flight'
                ' to get to Boston?')
    pipeline = load_spacy('en')
    return pipeline(sentence)
@pytest.mark.models
def test_issue955(doc):
    """Check that noun chunks do not nest: no token belongs to two chunks."""
    # NOTE(review): the file path says issue 995 while this function is named
    # 955 -- confirm which issue number is intended.
    visited = set()
    for chunk in doc.noun_chunks:
        for token in chunk:
            # Identify a token by its index in the document plus its text.
            ident = (token.i, token.text)
            # A repeat means this token was already yielded by an earlier chunk.
            assert ident not in visited
            visited.add(ident)