2020-03-29 14:56:07 +03:00
|
|
|
from spacy.lang.en import English
|
2020-08-14 16:00:52 +03:00
|
|
|
import pytest
|
2020-03-29 14:56:07 +03:00
|
|
|
|
|
|
|
|
|
|
|
def test_issue5152():
    # Regression check: computing the similarity between a Span and a Token
    # must work. The original bug appeared when the span's token count
    # matched the token's character count (three of each in this setup).
    nlp = English()
    doc = nlp("Talk about being boring!")
    doc_variant = nlp("Talk of being boring!")
    single_token = nlp("Let")[0]  # "Let"

    talk_about = doc[0:3]  # "Talk about being"
    talk_about_again = doc[0:3]  # same slice of the same doc
    talk_of = doc_variant[0:3]  # "Talk of being"

    # Span compared with a Token: a UserWarning is expected, score is 0.0.
    with pytest.warns(UserWarning):
        assert talk_about.similarity(single_token) == 0.0

    # Two identical slices score exactly 1.0; this comparison is made
    # outside any pytest.warns context.
    assert talk_about.similarity(talk_about_again) == 1.0

    # Spans that differ in one word: a UserWarning is expected and the
    # score must be strictly below 1.0.
    with pytest.warns(UserWarning):
        assert talk_about_again.similarity(talk_of) < 1.0
|