2018-02-07 04:06:11 +03:00
|
|
|
'''Test regression in Matcher introduced in v2.0.6.'''
|
2018-02-07 03:29:23 +03:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
import pytest
|
|
|
|
|
2018-02-07 04:06:11 +03:00
|
|
|
from ...vocab import Vocab
|
|
|
|
from ...tokens import Doc
|
|
|
|
from ...matcher import Matcher
|
2018-02-07 03:29:23 +03:00
|
|
|
|
|
|
|
def test_issue1945():
    """Check that the Matcher reports overlapping matches.

    A two-token pattern matching ``a a`` is applied to a three-token doc
    ``a a a``. Two matches are expected, and they overlap on the middle
    token.
    """
    text = "a a a"
    matcher = Matcher(Vocab())
    matcher.add('MWE', None, [{'orth': 'a'}, {'orth': 'a'}])
    # Derive the tokens from the sample text so the two cannot drift apart
    # (previously `text` was assigned but never used).
    doc = Doc(matcher.vocab, words=text.split())
    matches = matcher(doc)
    # We should see two overlapping matches here
    assert len(matches) == 2
    # Skip the first element of each match tuple and compare the remaining
    # pair (presumably the start/end token offsets -- see the Matcher docs).
    assert matches[0][1:] == (0, 2)
    assert matches[1][1:] == (1, 3)
|