mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-24 16:24:16 +03:00
* Add a test for Issue #118: Matcher behaves unpredictably with overlapping entities
This commit is contained in:
parent
73928001ed
commit
fd72b8b282
19
tests/matcher/test_matcher_bugfixes.py
Normal file
19
tests/matcher/test_matcher_bugfixes.py
Normal file
|
@ -0,0 +1,19 @@
|
|||
import pytest
|
||||
|
||||
|
||||
from spacy.matcher import Matcher
|
||||
|
||||
def test_overlap_issue118(EN):
    """Regression test for issue #118: overlapping match patterns.

    Registers two patterns under one 'BostonCeltics' entry -- the two-token
    sequence "boston celtics" and the single token "celtics" -- and runs the
    matcher over a sentence containing "boston celtics". The test expects a
    single match, (ORG, 9, 11), and afterwards a single entity on the doc
    with the same label and boundaries.
    """
    text = u'how many points did lebron james score against the boston celtics last night'
    doc = EN.tokenizer(text)
    org_label = doc.vocab.strings['ORG']

    # The second pattern overlaps the tail of the first; this overlap is
    # what the test exercises.
    full_name = [{'lower': 'boston'}, {'lower': 'celtics'}]
    short_name = [{'lower': 'celtics'}]
    patterns = {'BostonCeltics': ('ORG', {}, [full_name, short_name])}
    matcher = Matcher(EN.vocab, patterns)

    matches = matcher(doc)
    assert matches == [(org_label, 9, 11)]

    ents = list(doc.ents)
    assert len(ents) == 1
    only_ent = ents[0]
    assert only_ent.label == org_label
    assert only_ent.start == 9
    assert only_ent.end == 11
|
||||
|
Loading…
Reference in New Issue
Block a user