2014-09-25 20:29:42 +04:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
|
|
|
from spacy.en import *
|
2014-10-10 01:11:31 +04:00
|
|
|
from spacy.lexeme import *
|
2014-09-25 20:29:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_alpha():
    """Check the IS_ALPHA bit in the 'flags' field of three lexicon entries.

    The bit is expected to be set for 'the' and clear for both '1999' and
    'hello1'.
    """
    EN.load()
    alpha_mask = 1 << IS_ALPHA
    # (string to look up, whether the IS_ALPHA bit should be set)
    expectations = (
        ('the', True),
        ('1999', False),
        ('hello1', False),
    )
    for string, should_be_alpha in expectations:
        entry = EN.lexicon[string]
        assert bool(entry['flags'] & alpha_mask) == should_be_alpha
|
2014-09-25 20:29:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_digit():
    """Check the IS_DIGIT bit in the 'flags' field of three lexicon entries.

    The bit is expected to be set for '1999' and clear for both 'the' and
    'hello1'.
    """
    EN.load()
    digit_mask = 1 << IS_DIGIT
    # (string to look up, whether the IS_DIGIT bit should be set)
    expectations = (
        ('the', False),
        ('1999', True),
        ('hello1', False),
    )
    for string, should_be_digit in expectations:
        entry = EN.lexicon[string]
        assert bool(entry['flags'] & digit_mask) == should_be_digit
|