spaCy/spacy/tokens.pxd

78 lines
1.4 KiB
Cython
Raw Normal View History

2014-12-16 14:44:43 +03:00
from libc.stdint cimport uint32_t
2014-12-02 15:48:05 +03:00
import numpy as np
cimport numpy as np
from cymem.cymem cimport Pool
2014-12-04 12:46:55 +03:00
from thinc.typedefs cimport atom_t
from .lexeme cimport Lexeme
2014-12-08 13:12:15 +03:00
from .typedefs cimport flags_t
from .typedefs cimport Morphology
from .lang cimport Language
2014-12-08 13:12:15 +03:00
# Plain C record holding the per-token state. `Tokens.data` is declared as a
# pointer to values of this struct.
#
# Field order is part of the struct layout; do not reorder.
cdef struct TokenC:
    # Read-only pointer to the Lexeme entry for this token.
    const Lexeme* lex
    Morphology morph

    # NOTE(review): `idx` is presumably the token's offset in the source
    # string -- confirm against the .pyx implementation.
    int idx
    int pos
    int lemma
    int sense

    # NOTE(review): `head`, `dep_tag`, `l_kids` and `r_kids` look like
    # dependency-parse fields; whether `head` is absolute or relative and
    # whether `*_kids` are counts or bitmasks is not visible from this
    # declaration -- confirm before relying on either reading.
    int head
    int dep_tag
    uint32_t l_kids
    uint32_t r_kids
# Single-identifier aliases for the two pointer types, so that each can be
# listed as a member of the fused type below.
ctypedef const Lexeme* const_Lexeme_ptr
ctypedef TokenC* TokenC_ptr


# Fused type: a parameter declared as LexemeOrToken is specialised for
# either a `const Lexeme*` or a `TokenC*` argument.
ctypedef fused LexemeOrToken:
    const_Lexeme_ptr
    TokenC_ptr
cdef class Tokens:
    # C-level declaration of the Tokens extension type. Only attributes and
    # method signatures are declared in this .pxd.

    # NOTE(review): `mem` is presumably the cymem Pool that owns the buffer
    # behind `data` -- confirm in the implementation.
    cdef Pool mem
    cdef Language lang
    cdef list tag_names

    # Pointer to TokenC records, with two integer size fields.
    # NOTE(review): `length` / `max_length` look like used-size and capacity
    # of `data` -- confirm.
    cdef TokenC* data
    cdef int length
    cdef int max_length

    # `lex_or_tok` is the fused LexemeOrToken type, so it accepts either a
    # `const Lexeme*` or a `TokenC*`. `except -1`: a return value of -1
    # signals that a Python exception was raised.
    cdef int push_back(self, int i, LexemeOrToken lex_or_tok) except -1

    # Callable from both C and Python (cpdef); declared to return a
    # 2-dimensional ndarray of C `long`.
    cpdef np.ndarray[long, ndim=2] get_array(self, list features)
2014-12-02 15:48:05 +03:00
cdef class Token:
    # C-level attribute declarations for the Token extension type.
    # Attributes marked `public` are readable and writable from Python;
    # attributes without it are reachable from Cython code only.
    # Attribute order is kept exactly as declared.

    cdef public Language lang
    cdef public int i
    cdef public int idx

    # Not `public`: no automatic Python-level attribute is generated for
    # these two.
    # NOTE(review): presumably exposed through properties in the .pyx --
    # confirm.
    cdef int pos
    cdef int lemma

    cdef public int head
    cdef public int dep_tag

    # atom_t-typed attributes.
    # NOTE(review): these appear to mirror per-lexeme values -- confirm
    # where they are populated.
    cdef public atom_t id
    cdef public atom_t cluster
    cdef public atom_t length
    cdef public atom_t postype
    cdef public atom_t sensetype

    cdef public atom_t sic
    cdef public atom_t norm
    cdef public atom_t shape
    cdef public atom_t asciied
    cdef public atom_t prefix
    cdef public atom_t suffix

    cdef public float prob
    cdef public flags_t flags