mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 01:16:28 +03:00
Unicode string for Python 2.7
This commit is contained in:
parent
eca9cc5417
commit
673c81bbb4
|
@ -70,6 +70,6 @@ yet you your yours yourself yourselves
|
|||
)
|
||||
|
||||
for hyphen in ["'", "`", "‘", "´", "’"]:
|
||||
for stopword in "n't 'd 'll 'm 're 's 've".split():
|
||||
for stopword in u"n't 'd 'll 'm 're 's 've".split():
|
||||
STOP_WORDS.add(stopword.replace("'", hyphen))
|
||||
|
||||
|
|
|
@ -4,10 +4,10 @@ import pytest
|
|||
@pytest.mark.parametrize(
|
||||
"word",
|
||||
[
|
||||
"don't",
|
||||
"don’t",
|
||||
"I'd",
|
||||
"I’d",
|
||||
u"don't",
|
||||
u"don’t",
|
||||
u"I'd",
|
||||
u"I’d",
|
||||
],
|
||||
)
|
||||
def test_issue3521(en_tokenizer, word):
|
||||
|
|
Loading…
Reference in New Issue
Block a user