mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 18:06:29 +03:00
43 lines
717 B
Cython
43 lines
717 B
Cython
|
from spacy.spacy cimport Language
|
||
|
from spacy.word cimport Lexeme
|
||
|
cimport cython
|
||
|
|
||
|
|
||
|
# Module-level size_t identifiers. Judging by their names these label
# character-class / casing properties of a word -- TODO confirm meaning and
# values against the implementation file.
# NOTE(review): newer Cython releases reject `cpdef` on variables; these may
# need to become plain `cdef` declarations -- confirm against the Cython
# version the project builds with.
cpdef size_t ALPHA
cpdef size_t DIGIT
cpdef size_t PUNCT
cpdef size_t SPACE
cpdef size_t LOWER
cpdef size_t UPPER
cpdef size_t TITLE
cpdef size_t ASCII
|
||
|
|
||
|
# Module-level size_t identifiers with the OFT_ prefix. Presumably they mark
# the casing a word most often appears in -- TODO confirm against the
# implementation file.
cpdef size_t OFT_LOWER
cpdef size_t OFT_TITLE
cpdef size_t OFT_UPPER
|
||
|
|
||
|
# Module-level size_t identifiers. The names look like part-of-speech tags --
# TODO confirm meaning and values against the implementation file.
# PUNCT is not repeated here: it is already declared earlier in this file
# with the same type, and a module-level name can only be declared once.
# NOTE(review): if a separate tag-level PUNCT value is needed, it must be
# given a distinct name.
cpdef size_t CONJ
cpdef size_t NUM
cpdef size_t N
cpdef size_t DET
cpdef size_t ADP
cpdef size_t ADJ
cpdef size_t ADV
cpdef size_t VERB
cpdef size_t NOUN
cpdef size_t PDT
cpdef size_t POS
cpdef size_t PRON
cpdef size_t PRT
|
||
|
|
||
|
# Extension type for English, derived from the cimported `Language` type.
# The base class is referenced by its bare name because the file binds only
# `Language` (via `from spacy.spacy cimport Language`); no module named
# `spacy` is in scope for a dotted `spacy.Language` lookup.
cdef class English(Language):
    # C-level method: takes a unicode word and returns a C int.
    # Presumably the index at which the word should be split -- TODO confirm
    # against the implementation file.
    cdef int find_split(self, unicode word)
|
||
|
|
||
|
|
||
|
# Module-level C variable of type English.
# Presumably the shared instance used by the module-level functions declared
# in this file -- TODO confirm against the implementation file.
cdef English EN
|
||
|
|
||
|
|
||
|
# Module-level function callable from both C and Python: takes a unicode
# word and is declared to return a `Word`.
# NOTE(review): `Word` is not among the names cimported at the top of this
# file (only `Language`, `Lexeme` and `cython` are). Confirm whether a
# `Word` cimport is missing or the return type should be `Lexeme`.
cpdef Word lookup(unicode word)
|
||
|
# Module-level function callable from both C and Python: takes a unicode
# string and returns a Python list.
# Presumably the list holds one entry per token -- TODO confirm element type
# against the implementation file.
cpdef list tokenize(unicode string)
|