Fix syntax iterators

This commit is contained in:
Matthew Honnibal 2017-06-04 15:51:50 -05:00
parent 6d0356e6cc
commit e28f90b672
3 changed files with 7 additions and 7 deletions

View File

@@ -15,9 +15,9 @@ def noun_chunks(obj):
# and not just "eine Tasse", same for "das Thema Familie". # and not just "eine Tasse", same for "das Thema Familie".
labels = ['sb', 'oa', 'da', 'nk', 'mo', 'ag', 'ROOT', 'root', 'cj', 'pd', 'og', 'app'] labels = ['sb', 'oa', 'da', 'nk', 'mo', 'ag', 'ROOT', 'root', 'cj', 'pd', 'og', 'app']
doc = obj.doc # Ensure works on both Doc and Span. doc = obj.doc # Ensure works on both Doc and Span.
np_label = doc.vocab.strings['NP'] np_label = doc.vocab.strings.add('NP')
np_deps = set(doc.vocab.strings[label] for label in labels) np_deps = set(doc.vocab.strings.add(label) for label in labels)
close_app = doc.vocab.strings['nk'] close_app = doc.vocab.strings.add('nk')
rbracket = 0 rbracket = 0
for i, word in enumerate(obj): for i, word in enumerate(obj):

View File

@@ -31,7 +31,7 @@ class EnglishDefaults(Language.Defaults):
lemma_rules = dict(LEMMA_RULES) lemma_rules = dict(LEMMA_RULES)
lemma_index = dict(LEMMA_INDEX) lemma_index = dict(LEMMA_INDEX)
lemma_exc = dict(LEMMA_EXC) lemma_exc = dict(LEMMA_EXC)
sytax_iterators = dict(SYNTAX_ITERATORS) syntax_iterators = dict(SYNTAX_ITERATORS)
class English(Language): class English(Language):

View File

@@ -11,9 +11,9 @@ def noun_chunks(obj):
labels = ['nsubj', 'dobj', 'nsubjpass', 'pcomp', 'pobj', labels = ['nsubj', 'dobj', 'nsubjpass', 'pcomp', 'pobj',
'attr', 'ROOT'] 'attr', 'ROOT']
doc = obj.doc # Ensure works on both Doc and Span. doc = obj.doc # Ensure works on both Doc and Span.
np_deps = [doc.vocab.strings[label] for label in labels] np_deps = [doc.vocab.strings.add(label) for label in labels]
conj = doc.vocab.strings['conj'] conj = doc.vocab.strings.add('conj')
np_label = doc.vocab.strings['NP'] np_label = doc.vocab.strings.add('NP')
seen = set() seen = set()
for i, word in enumerate(obj): for i, word in enumerate(obj):
if word.pos not in (NOUN, PROPN, PRON): if word.pos not in (NOUN, PROPN, PRON):