spaCy/spacy/lang.pxd
2014-08-27 19:38:57 +02:00

30 lines
672 B
Cython

from libc.stdint cimport uint32_t
from libc.stdint cimport uint64_t
from spacy.word cimport Lexeme
cdef class Lexicon:
cdef public dict probs
cdef public dict clusters
cdef public dict case_stats
cdef public dict tag_stats
cdef public list flag_checkers
cdef public list string_transformers
cdef dict lexicon
cpdef Lexeme lookup(self, unicode string)
cdef class Language:
cdef object name
cdef dict cache
cpdef readonly Lexicon lexicon
cpdef list tokenize(self, unicode text)
cdef list _tokenize(self, unicode string)
cpdef list _split(self, unicode string)
cpdef int _split_one(self, unicode word)