2017-04-15 13:05:47 +03:00
|
|
|
# coding: utf8
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
2016-10-16 02:47:12 +03:00
|
|
|
from .syntax.parser cimport Parser
|
2017-03-11 16:00:20 +03:00
|
|
|
from .syntax.beam_parser cimport BeamParser
|
2016-10-16 02:47:12 +03:00
|
|
|
from .syntax.ner cimport BiluoPushDown
|
|
|
|
from .syntax.arc_eager cimport ArcEager
|
2016-10-16 22:34:57 +03:00
|
|
|
from .tagger import Tagger
|
2016-10-16 02:47:12 +03:00
|
|
|
|
2016-10-16 22:34:57 +03:00
|
|
|
# TODO: The disorganization here is pretty embarrassing. At least it's only
|
|
|
|
# internals.
|
|
|
|
from .syntax.parser import get_templates as get_feature_templates
|
2016-10-23 18:45:44 +03:00
|
|
|
from .attrs import DEP, ENT_TYPE
|
2016-10-16 02:47:12 +03:00
|
|
|
|
|
|
|
|
2017-03-11 21:45:37 +03:00
|
|
|
cdef class EntityRecognizer(Parser):
|
2017-04-15 12:59:21 +03:00
|
|
|
"""
|
|
|
|
Annotate named entities on Doc objects.
|
|
|
|
"""
|
2016-10-16 22:34:57 +03:00
|
|
|
TransitionSystem = BiluoPushDown
|
2017-03-11 16:00:20 +03:00
|
|
|
|
2016-10-16 22:34:57 +03:00
|
|
|
feature_templates = get_feature_templates('ner')
|
2016-10-16 02:47:12 +03:00
|
|
|
|
2016-10-23 18:45:44 +03:00
|
|
|
def add_label(self, label):
|
2017-04-15 00:52:17 +03:00
|
|
|
Parser.add_label(self, label)
|
2016-10-23 18:45:44 +03:00
|
|
|
if isinstance(label, basestring):
|
|
|
|
label = self.vocab.strings[label]
|
|
|
|
|
2016-10-16 02:47:12 +03:00
|
|
|
|
2017-03-15 17:27:41 +03:00
|
|
|
cdef class BeamEntityRecognizer(BeamParser):
|
2017-04-15 12:59:21 +03:00
|
|
|
"""
|
|
|
|
Annotate named entities on Doc objects.
|
|
|
|
"""
|
2017-03-15 17:27:41 +03:00
|
|
|
TransitionSystem = BiluoPushDown
|
|
|
|
|
|
|
|
feature_templates = get_feature_templates('ner')
|
2017-04-15 13:05:47 +03:00
|
|
|
|
2017-03-15 17:27:41 +03:00
|
|
|
def add_label(self, label):
|
2017-04-15 00:52:17 +03:00
|
|
|
Parser.add_label(self, label)
|
2017-03-15 17:27:41 +03:00
|
|
|
if isinstance(label, basestring):
|
|
|
|
label = self.vocab.strings[label]
|
|
|
|
|
|
|
|
|
2017-03-11 20:11:30 +03:00
|
|
|
cdef class DependencyParser(Parser):
|
2016-10-16 22:34:57 +03:00
|
|
|
TransitionSystem = ArcEager
|
2016-10-16 02:47:12 +03:00
|
|
|
|
2016-10-16 22:34:57 +03:00
|
|
|
feature_templates = get_feature_templates('basic')
|
2016-10-23 18:45:44 +03:00
|
|
|
|
|
|
|
def add_label(self, label):
|
2017-04-15 00:52:17 +03:00
|
|
|
Parser.add_label(self, label)
|
2016-10-23 18:45:44 +03:00
|
|
|
if isinstance(label, basestring):
|
|
|
|
label = self.vocab.strings[label]
|
|
|
|
|
2016-10-16 02:47:12 +03:00
|
|
|
|
2017-03-15 17:27:41 +03:00
|
|
|
cdef class BeamDependencyParser(BeamParser):
|
|
|
|
TransitionSystem = ArcEager
|
|
|
|
|
|
|
|
feature_templates = get_feature_templates('basic')
|
|
|
|
|
|
|
|
def add_label(self, label):
|
2017-04-15 00:52:17 +03:00
|
|
|
Parser.add_label(self, label)
|
2017-03-15 17:27:41 +03:00
|
|
|
if isinstance(label, basestring):
|
|
|
|
label = self.vocab.strings[label]
|
|
|
|
|
|
|
|
|
|
|
|
__all__ = [Tagger, DependencyParser, EntityRecognizer, BeamDependencyParser, BeamEntityRecognizer]
|