2014-07-07 14:47:21 +04:00
|
|
|
from spacy.spacy cimport Language
|
2014-08-22 18:35:48 +04:00
|
|
|
from spacy.lexeme cimport LexID
|
2014-07-07 14:47:21 +04:00
|
|
|
from spacy.tokens cimport Tokens
|
2014-08-22 18:35:48 +04:00
|
|
|
from spacy.lexeme cimport StringHash
|
2014-07-07 06:29:24 +04:00
|
|
|
|
|
|
|
|
2014-08-22 18:35:48 +04:00
|
|
|
# Extension type declaration: PennTreebank3 derives from Language
# (cimported from spacy.spacy). Only the C-level interface is declared
# here; no method bodies are visible in this file.
# NOTE(review): the name suggests Penn Treebank 3 tokenization rules --
# confirm against the implementation.
cdef class PennTreebank3(Language):
|
|
|
|
# cpdef method (callable from both Cython and Python): takes a unicode
# `word` and returns a Python list.
# NOTE(review): presumably the list holds the pieces `word` is split
# into; the element type and splitting rules are not visible here.
cpdef list find_substrings(self, unicode word)
|
2014-07-07 14:47:21 +04:00
|
|
|
|
2014-07-07 06:29:24 +04:00
|
|
|
|
2014-08-22 18:35:48 +04:00
|
|
|
# Module-level C variable typed as PennTreebank3.
# NOTE(review): presumably the shared instance used by the module-level
# lookup/tokenize/unhash functions -- its initialization is not visible
# here; confirm in the implementation.
cdef PennTreebank3 PTB3
|
2014-07-07 06:29:24 +04:00
|
|
|
|
2014-08-22 18:35:48 +04:00
|
|
|
# Module-level cpdef function: takes a unicode `word` and returns a LexID
# (type cimported from spacy.lexeme).
# `except 0` reserves the return value 0 as the error signal: C-level
# callers treat a 0 return as "an exception was raised" and propagate it,
# so 0 can never be a valid LexID result.
cpdef LexID lookup(unicode word) except 0
|
2014-07-07 14:47:21 +04:00
|
|
|
# Module-level cpdef function: takes a unicode `string` and returns a
# Tokens object (type cimported from spacy.tokens).
# Declaration only; the tokenization behavior is not visible here.
cpdef Tokens tokenize(unicode string)
|
2014-07-07 06:29:24 +04:00
|
|
|
# Module-level cpdef function: takes a StringHash `hash_value` (type
# cimported from spacy.lexeme) and returns a unicode string.
# NOTE(review): presumably the inverse of the string -> hash mapping;
# behavior for an unknown hash is not visible here -- confirm.
cpdef unicode unhash(StringHash hash_value)
|