mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 09:56:28 +03:00
709c9e75af
* return first sentence when span contains sentence boundary * docs fix * small fixes * cleanup
26 lines
866 B
Python
26 lines
866 B
Python
from spacy.tokens.doc import Doc
|
|
from spacy.vocab import Vocab
|
|
from spacy.pipeline._parser_internals.arc_eager import ArcEager
|
|
|
|
|
|
def test_issue7056():
    """Regression test for issue 7056.

    Checks that the Unshift transition behaves correctly and does not
    introduce sentence segmentation errors. A fixed sequence of transitions
    is replayed on a five-token doc, after which ``state.eol()`` must be
    falsy.
    """
    vocab = Vocab()
    strings = vocab.strings
    # Only the labels used by the replayed transitions are registered.
    actions = ArcEager.get_actions(left_labels=["amod"], right_labels=["pobj"])
    ae = ArcEager(strings, actions)

    doc = Doc(vocab, words="Severe pain , after trauma".split())
    # init_batch takes a list of docs; only the single resulting state is used.
    state = ae.init_batch([doc])[0]

    # Transition names are applied strictly in this order.
    transitions = ("S", "L-amod", "S", "S", "S", "R-pobj", "D", "D", "D")
    for name in transitions:
        ae.apply_transition(state, name)

    assert not state.eol()
|