from thinc.typedefs cimport atom_t from .lang cimport Language from .tokens cimport Tokens from .tokens cimport TokenC # Flags cpdef enum FlagID: IS_ALPHA IS_ASCII IS_DIGIT IS_LOWER IS_PUNCT IS_SPACE IS_TITLE IS_UPPER LIKE_URL LIKE_NUMBER OFT_LOWER OFT_TITLE OFT_UPPER IN_MALES IN_FEMALES IN_SURNAMES IN_PLACES IN_GAMES IN_CELEBS IN_NAMES cpdef enum: P2_sic P2_cluster P2_shape P2_prefix P2_suffix P2_pos P2_sense P1_sic P1_cluster P1_shape P1_prefix P1_suffix P1_pos P1_sense W_sic W_cluster W_shape W_prefix W_suffix W_pos W_sense N1_sic N1_cluster N1_shape N1_prefix N1_suffix N1_pos N1_sense N2_sic N2_cluster N2_shape N2_prefix N2_suffix N2_pos N2_sense N_CONTEXT_FIELDS cdef inline void fill_pos_context(atom_t* context, const int i, const TokenC* tokens) nogil: _fill_from_token(&context[P2_sic], &tokens[i-2]) _fill_from_token(&context[P1_sic], &tokens[i-1]) _fill_from_token(&context[W_sic], &tokens[i]) _fill_from_token(&context[N1_sic], &tokens[i+1]) _fill_from_token(&context[N2_sic], &tokens[i+2]) cdef inline void _fill_from_token(atom_t* context, const TokenC* t) nogil: context[0] = t.lex.sic context[1] = t.lex.cluster context[2] = t.lex.shape context[3] = t.lex.prefix context[4] = t.lex.suffix context[5] = t.pos context[6] = t.sense cdef class English(Language): pass