# Cython declarations for the English language module: the `English`
# extension type, the module-level `EN` instance, and the module-level
# cpdef entry points.

from libcpp.vector cimport vector

from spacy.spacy cimport StringHash
from spacy.spacy cimport Lexeme
from spacy.spacy cimport Lexeme_addr
from spacy.spacy cimport Language

from spacy.tokens cimport Tokens


# The base class is referenced through the `Language` name cimported above;
# no module named `spacy` is cimported in this file, so a qualified
# `spacy.Language` reference would not resolve from these declarations.
cdef class English(Language):
    # C-level method taking a unicode word and returning an int.
    # No exception return value is declared for this method.
    # NOTE(review): presumably returns a split index within `word` --
    # confirm against the implementation.
    cdef int find_split(self, unicode word)

    # C-level method taking a unicode word and a pointer to a Lexeme.
    # `except -1`: a return value of -1 signals that an exception was raised.
    cdef int set_orth(self, unicode word, Lexeme* lex) except -1


# Module-level variable of type English.
cdef English EN


# cpdef functions are callable from both Python and C code.

# `except 0`: a return value of 0 is reserved to signal a raised exception.
cpdef Lexeme_addr lookup(unicode word) except 0

# Takes a unicode string and returns a Tokens object.
cpdef Tokens tokenize(unicode string)

# Takes a StringHash value and returns a unicode string.
cpdef unicode unhash(StringHash hash_value)