2014-09-25 20:29:42 +04:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
|
|
|
from spacy.en import *
|
2014-10-10 01:11:31 +04:00
|
|
|
from spacy.lexeme import *
|
2014-09-25 20:29:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_alpha():
    """Check the IS_ALPHA bit in the 'flags' field of three lexicon entries.

    'the' is expected to have the bit set; '1999' and 'hello1' are
    expected to have it clear.
    """
    # Single-bit mask selecting the IS_ALPHA position within 'flags'.
    alpha_mask = 1 << IS_ALPHA

    article = EN.lexicon.lookup('the')
    assert article['flags'] & alpha_mask

    number = EN.lexicon.lookup('1999')
    assert not (number['flags'] & alpha_mask)

    alnum = EN.lexicon.lookup('hello1')
    assert not (alnum['flags'] & alpha_mask)
|
2014-09-25 20:29:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_digit():
    """Check the IS_DIGIT bit in the 'flags' field of three lexicon entries.

    '1999' is expected to have the bit set; 'the' and 'hello1' are
    expected to have it clear.
    """
    # Single-bit mask selecting the IS_DIGIT position within 'flags'.
    digit_mask = 1 << IS_DIGIT

    article = EN.lexicon.lookup('the')
    assert not (article['flags'] & digit_mask)

    number = EN.lexicon.lookup('1999')
    assert number['flags'] & digit_mask

    alnum = EN.lexicon.lookup('hello1')
    assert not (alnum['flags'] & digit_mask)
|