mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	* return first sentence when span contains sentence boundary * docs fix * small fixes * cleanup
		
			
				
	
	
		
			26 lines
		
	
	
		
			866 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			26 lines
		
	
	
		
			866 B
		
	
	
	
		
			Python
		
	
	
	
	
	
from spacy.tokens.doc import Doc
 | 
						|
from spacy.vocab import Vocab
 | 
						|
from spacy.pipeline._parser_internals.arc_eager import ArcEager
 | 
						|
 | 
						|
 | 
						|
def test_issue7056():
    """Replay a fixed sequence of arc-eager transitions and check that the
    parse state does not report end-of-line afterwards.

    Guards against the Unshift transition misbehaving and causing sentence
    segmentation errors.
    """
    words = "Severe pain , after trauma".split()
    # Applied strictly in this order; the sequence is the regression scenario.
    transition_names = ("S", "L-amod", "S", "S", "S", "R-pobj", "D", "D", "D")

    vocab = Vocab()
    actions = ArcEager.get_actions(left_labels=["amod"], right_labels=["pobj"])
    moves = ArcEager(vocab.strings, actions)

    doc = Doc(vocab, words=words)
    state = moves.init_batch([doc])[0]
    for name in transition_names:
        moves.apply_transition(state, name)

    assert not state.eol()
 |