Add failing test for issue 2671: Incorrect rule ID returned from matcher

2025-12-03 08:14:20 +03:00 · 2018-08-15 15:54:33 +02:00 · 2018-08-15 15:54:33 +02:00 · 7cfa665ce6
commit 7cfa665ce6
parent 1b2a5869ab
1 changed files with 25 additions and 0 deletions
--- a/spacy/tests/regression/test_issue2671.py
+++ b/spacy/tests/regression/test_issue2671.py
@ -0,0 +1,25 @@
 # coding: utf-8
 from __future__ import unicode_literals
 from spacy.lang.en import English
 from spacy.matcher import Matcher
 def get_rule_id(nlp, matcher, doc):
    matches = matcher(doc)
    for match_id, start, end in matches:
        rule_id = nlp.vocab.strings[match_id]
        span = doc[start:end]
        return rule_id
 def test_issue2671():
    nlp = English()
    matcher = Matcher(nlp.vocab)
    pattern = [{'LOWER': 'high'}, {'IS_PUNCT': True, 'OP': '?'}, {'LOWER': 'adrenaline'}]
    matcher.add("test_pattern", None, pattern)
    doc1 = nlp("This is a high-adrenaline situation.")
    doc2 = nlp("This is a high adrenaline situation.")
    # Works correctly
    assert get_rule_id(nlp, matcher, doc1) == 'test_pattern'
    assert get_rule_id(nlp, matcher, doc2) == 'test_pattern'