spaCy/spacy/tests/regression/test_issue3879.py
2019-08-20 16:41:58 +02:00

17 lines
496 B
Python

# coding: utf8
from __future__ import unicode_literals
import pytest
from spacy.matcher import Matcher
from spacy.tokens import Doc
@pytest.mark.xfail(
    reason="Matcher returns a false-positive match for 'is a test'"
)
def test_issue3879(en_vocab):
    """Regression test for issue #3879: two leading optional tokens.

    The pattern is an optional literal "This", followed by an optional
    wildcard token, followed by the literal "test". On the document
    "This is a test ." exactly two matches are expected (presumably the
    spans "test" and "a test"). The test is marked as an expected failure
    because the matcher additionally reports the span "is a test", whose
    first token does not satisfy the optional ``ORTH: "This"`` constraint.
    """
    doc = Doc(en_vocab, words=["This", "is", "a", "test", "."])
    # Sanity check that the Doc was built with one token per word.
    assert len(doc) == 5
    pattern = [{"ORTH": "This", "OP": "?"}, {"OP": "?"}, {"ORTH": "test"}]
    matcher = Matcher(en_vocab)
    # Second positional argument is the on-match callback; none is needed here.
    matcher.add("TEST", None, pattern)
    assert len(matcher(doc)) == 2  # fails because of a FP match 'is a test'