mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-26 09:14:32 +03:00
parent
2dc0d28cc4
commit
cc36c308f4
|
@ -11,9 +11,11 @@ def english_noun_chunks(obj):
|
|||
conj = doc.vocab.strings['conj']
|
||||
np_label = doc.vocab.strings['NP']
|
||||
for i, word in enumerate(obj):
|
||||
if word.pos in (NOUN, PROPN, PRON) and word.dep in np_deps:
|
||||
if word.pos not in (NOUN, PROPN, PRON):
|
||||
continue
|
||||
if word.dep in np_deps:
|
||||
yield word.left_edge.i, word.i+1, np_label
|
||||
elif word.pos == NOUN and word.dep == conj:
|
||||
elif word.dep == conj:
|
||||
head = word.head
|
||||
while head.dep == conj and head.head.i < head.i:
|
||||
head = head.head
|
||||
|
|
|
@ -4,7 +4,6 @@ from __future__ import unicode_literals
|
|||
import pytest
|
||||
|
||||
|
||||
@pytest.mark.xfail
|
||||
@pytest.mark.models
|
||||
def test_issue693(EN):
|
||||
"""Test that doc.noun_chunks parses the complete sentence."""
|
||||
|
@ -15,5 +14,7 @@ def test_issue693(EN):
|
|||
doc2 = EN(text2)
|
||||
chunks1 = [chunk for chunk in doc1.noun_chunks]
|
||||
chunks2 = [chunk for chunk in doc2.noun_chunks]
|
||||
for word in doc1:
|
||||
print(word.text, word.dep_, word.head.text)
|
||||
assert len(chunks1) == 2
|
||||
assert len(chunks2) == 2
|
||||
|
|
Loading…
Reference in New Issue
Block a user