Add xfailing test (see #1971, #2675, #2671)

2025-12-09 11:14:21 +03:00 · 2019-02-08 20:50:01 +01:00 · 2019-02-08 20:50:01 +01:00 · 414a69b736
commit 414a69b736
parent ea07f3022e
1 changed files with 23 additions and 0 deletions
--- a/spacy/tests/regression/test_issue1971.py
+++ b/spacy/tests/regression/test_issue1971.py
@@ -0,0 +1,23 @@
+# coding: utf8
+from __future__ import unicode_literals
+
+from spacy.matcher import Matcher
+from spacy.tokens import Token, Doc
+
+
+def test_issue1971(en_vocab):
+    """Regression test for #1971; possibly related to #2675 and #2671."""
+    matcher = Matcher(en_vocab)
+    pattern = [
+        {"ORTH": "Doe"},
+        {"ORTH": "!", "OP": "?"},
+        {"_": {"optional": True}, "OP": "?"},
+        {"ORTH": "!", "OP": "?"},
+    ]
+    Token.set_extension("optional", default=False, force=True)  # safe to re-run
+    matcher.add("TEST", None, pattern)
+    doc = Doc(en_vocab, words=["Hello", "John", "Doe", "!"])
+    # Asserting exactly one match would also work, but this check is more
+    # conclusive: the actual bug is a duplicate match whose match_id is not
+    # in the vocab's string store at all.
+    assert all(match_id in en_vocab.strings for match_id, start, end in matcher(doc))