2015-01-05 09:54:54 +03:00
|
|
|
from __future__ import unicode_literals
|
2014-09-02 01:27:09 +04:00
|
|
|
import pytest
|
|
|
|
|
2014-09-02 01:41:43 +04:00
|
|
|
from spacy.orth import is_alpha
|
|
|
|
from spacy.orth import is_digit
|
|
|
|
from spacy.orth import is_punct
|
|
|
|
from spacy.orth import is_space
|
|
|
|
from spacy.orth import is_ascii
|
|
|
|
from spacy.orth import is_upper
|
|
|
|
from spacy.orth import is_lower
|
|
|
|
from spacy.orth import is_title
|
2014-09-02 01:27:09 +04:00
|
|
|
|
|
|
|
|
|
|
|
@pytest.fixture
def words():
    """Provide the sample strings shared by the orthography predicate tests.

    The list mixes digit-only, decimal, alphanumeric, title-case, upper-case,
    whitespace and punctuation strings; tests address entries by index, so
    the order must not change.
    """
    samples = [
        "1997",    # 0: digits only
        "19.97",   # 1: digits with a decimal point
        "hello9",  # 2: lower-case letters followed by a digit
        "Hello",   # 3: title-case letters
        "HELLO",   # 4: upper-case letters
        "Hello9",  # 5: title-case letters followed by a digit
        "\n",      # 6: a lone newline
        "!",       # 7: a lone punctuation mark
        "!d",      # 8: punctuation followed by a letter
        "\nd",     # 9: newline followed by a letter
    ]
    return samples
|
|
|
|
|
|
|
|
def test_is_alpha(words):
    """Check that is_alpha is truthy only for the all-letter samples.

    Of the ten fixture entries, only index 3 ("Hello") and index 4 ("HELLO")
    are expected to pass; every entry containing a digit, whitespace or
    punctuation character is expected to be rejected.
    """
    # Expected truthiness of is_alpha(words[i]), listed in index order.
    expected = (
        False,  # words[0]
        False,  # words[1]
        False,  # words[2]
        True,   # words[3]
        True,   # words[4]
        False,  # words[5]
        False,  # words[6]
        False,  # words[7]
        False,  # words[8]
        False,  # words[9]
    )
    for index, should_match in enumerate(expected):
        # bool() keeps the original truthiness semantics of `assert` /
        # `assert not`, whatever type the predicate returns.
        assert bool(is_alpha(words[index])) is should_match
|
2014-09-02 01:27:09 +04:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_digit(words):
    """Check that is_digit is truthy only for the digits-only sample.

    Of the ten fixture entries, only index 0 ("1997") is expected to pass;
    the decimal "19.97" and every entry containing letters, whitespace or
    punctuation are expected to be rejected.
    """
    # Expected truthiness of is_digit(words[i]), listed in index order.
    expected = (
        True,   # words[0]
        False,  # words[1]
        False,  # words[2]
        False,  # words[3]
        False,  # words[4]
        False,  # words[5]
        False,  # words[6]
        False,  # words[7]
        False,  # words[8]
        False,  # words[9]
    )
    for index, should_match in enumerate(expected):
        # bool() keeps the original truthiness semantics of `assert` /
        # `assert not`, whatever type the predicate returns.
        assert bool(is_digit(words[index])) is should_match
|