spaCy/tests/test_only_punct.py

15 lines
265 B
Python

from __future__ import unicode_literals
import pytest
from spacy.en import EN
def test_only_pre1():
    """A string holding a single "(" must tokenize to exactly one token."""
    assert len(EN.tokenize("(")) == 1
def test_only_pre2():
    """Two adjacent "(" characters must tokenize to two separate tokens."""
    assert len(EN.tokenize("((")) == 2
def test_only_suf2():
    """Two adjacent apostrophes must tokenize to two separate tokens."""
    assert len(EN.tokenize("''")) == 2