* Add extra context tokens

This commit is contained in:
Matthew Honnibal 2014-11-07 04:40:36 +11:00
parent 50309e6e49
commit b4454cf036
2 changed files with 20 additions and 0 deletions

View File

@ -46,11 +46,15 @@ cdef class Token:
cdef class Slots: cdef class Slots:
cdef readonly Token P4
cdef readonly Token P3
cdef readonly Token P2 cdef readonly Token P2
cdef readonly Token P1 cdef readonly Token P1
cdef readonly Token N0 cdef readonly Token N0
cdef readonly Token N1 cdef readonly Token N1
cdef readonly Token N2 cdef readonly Token N2
cdef readonly Token N3
cdef readonly Token N4
cdef int N_FIELDS cdef int N_FIELDS

View File

@ -4,11 +4,15 @@ from .lexeme cimport *
cdef class Slots: cdef class Slots:
def __init__(self): def __init__(self):
self.P4 = Token()
self.P3 = Token()
self.P2 = Token() self.P2 = Token()
self.P1 = Token() self.P1 = Token()
self.N0 = Token() self.N0 = Token()
self.N1 = Token() self.N1 = Token()
self.N2 = Token() self.N2 = Token()
self.N3 = Token()
self.N4 = Token()
cdef void _number_token(Token t, int* n_fields): cdef void _number_token(Token t, int* n_fields):
@ -137,26 +141,38 @@ cdef int _flatten_token(atom_t* context, Token ids, Token vals) except -1:
cdef hash_t fill_slots(Slots s, int i, Tokens tokens) except 0: cdef hash_t fill_slots(Slots s, int i, Tokens tokens) except 0:
fill_token(s.P4, tokens.lex[i-4], tokens.pos[i-4], tokens.ner[i-4])
fill_token(s.P3, tokens.lex[i-3], tokens.pos[i-3], tokens.ner[i-3])
fill_token(s.P2, tokens.lex[i-2], tokens.pos[i-2], tokens.ner[i-2]) fill_token(s.P2, tokens.lex[i-2], tokens.pos[i-2], tokens.ner[i-2])
fill_token(s.P1, tokens.lex[i-1], tokens.pos[i-1], tokens.ner[i-1]) fill_token(s.P1, tokens.lex[i-1], tokens.pos[i-1], tokens.ner[i-1])
fill_token(s.N0, tokens.lex[i], tokens.pos[i], tokens.ner[i]) fill_token(s.N0, tokens.lex[i], tokens.pos[i], tokens.ner[i])
fill_token(s.N1, tokens.lex[i+1], tokens.pos[i+1], tokens.ner[i+1]) fill_token(s.N1, tokens.lex[i+1], tokens.pos[i+1], tokens.ner[i+1])
fill_token(s.N2, tokens.lex[i+2], tokens.pos[i+2], tokens.ner[i+2]) fill_token(s.N2, tokens.lex[i+2], tokens.pos[i+2], tokens.ner[i+2])
fill_token(s.N3, tokens.lex[i+3], tokens.pos[i+3], tokens.ner[i+3])
fill_token(s.N4, tokens.lex[i+4], tokens.pos[i+4], tokens.ner[i+4])
return 1 return 1
cdef int fill_flat(atom_t* context, Slots s) except -1: cdef int fill_flat(atom_t* context, Slots s) except -1:
_flatten_token(context, FIELD_IDS.P4, s.P4)
_flatten_token(context, FIELD_IDS.P3, s.P3)
_flatten_token(context, FIELD_IDS.P2, s.P2) _flatten_token(context, FIELD_IDS.P2, s.P2)
_flatten_token(context, FIELD_IDS.P1, s.P1) _flatten_token(context, FIELD_IDS.P1, s.P1)
_flatten_token(context, FIELD_IDS.N0, s.N0) _flatten_token(context, FIELD_IDS.N0, s.N0)
_flatten_token(context, FIELD_IDS.N1, s.N1) _flatten_token(context, FIELD_IDS.N1, s.N1)
_flatten_token(context, FIELD_IDS.N2, s.N2) _flatten_token(context, FIELD_IDS.N2, s.N2)
_flatten_token(context, FIELD_IDS.N3, s.N4)
_flatten_token(context, FIELD_IDS.N4, s.N4)
N_FIELDS = 0 N_FIELDS = 0
FIELD_IDS = Slots() FIELD_IDS = Slots()
_number_token(FIELD_IDS.P4, &N_FIELDS)
_number_token(FIELD_IDS.P3, &N_FIELDS)
_number_token(FIELD_IDS.P2, &N_FIELDS) _number_token(FIELD_IDS.P2, &N_FIELDS)
_number_token(FIELD_IDS.P1, &N_FIELDS) _number_token(FIELD_IDS.P1, &N_FIELDS)
_number_token(FIELD_IDS.N0, &N_FIELDS) _number_token(FIELD_IDS.N0, &N_FIELDS)
_number_token(FIELD_IDS.N1, &N_FIELDS) _number_token(FIELD_IDS.N1, &N_FIELDS)
_number_token(FIELD_IDS.N2, &N_FIELDS) _number_token(FIELD_IDS.N2, &N_FIELDS)
_number_token(FIELD_IDS.N3, &N_FIELDS)
_number_token(FIELD_IDS.N4, &N_FIELDS)