Add beam-search classes

This commit is contained in:
Matthew Honnibal 2017-03-15 09:27:41 -05:00
parent c79b3129e3
commit 7769bc31e3

View File

@ -29,6 +29,24 @@ cdef class EntityRecognizer(Parser):
self.vocab._serializer = None self.vocab._serializer = None
cdef class BeamEntityRecognizer(BeamParser):
"""Annotate named entities on Doc objects."""
TransitionSystem = BiluoPushDown
feature_templates = get_feature_templates('ner')
def add_label(self, label):
for action in self.moves.action_types:
self.moves.add_action(action, label)
if isinstance(label, basestring):
label = self.vocab.strings[label]
for attr, freqs in self.vocab.serializer_freqs:
if attr == ENT_TYPE and label not in freqs:
freqs.append([label, 1])
# Super hacky :(
self.vocab._serializer = None
cdef class DependencyParser(Parser): cdef class DependencyParser(Parser):
TransitionSystem = ArcEager TransitionSystem = ArcEager
@ -46,4 +64,21 @@ cdef class DependencyParser(Parser):
self.vocab._serializer = None self.vocab._serializer = None
__all__ = [Tagger, DependencyParser, EntityRecognizer] cdef class BeamDependencyParser(BeamParser):
TransitionSystem = ArcEager
feature_templates = get_feature_templates('basic')
def add_label(self, label):
for action in self.moves.action_types:
self.moves.add_action(action, label)
if isinstance(label, basestring):
label = self.vocab.strings[label]
for attr, freqs in self.vocab.serializer_freqs:
if attr == DEP and label not in freqs:
freqs.append([label, 1])
# Super hacky :(
self.vocab._serializer = None
__all__ = [Tagger, DependencyParser, EntityRecognizer, BeamDependencyParser, BeamEntityRecognizer]