mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 09:57:26 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			28 lines
		
	
	
		
			715 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			28 lines
		
	
	
		
			715 B
		
	
	
	
		
			Python
		
	
	
	
	
	
from __future__ import unicode_literals
 | 
						|
from ...tokens import Doc
 | 
						|
from ...vocab import Vocab
 | 
						|
 | 
						|
 | 
						|
def test_issue1834():
 | 
						|
    """test if sentence boundaries & parse/tag flags are not lost
 | 
						|
    during serialization
 | 
						|
    """
 | 
						|
    words = "This is a first sentence . And another one".split()
 | 
						|
    vocab = Vocab()
 | 
						|
    doc = Doc(vocab, words=words)
 | 
						|
    vocab = doc.vocab
 | 
						|
    doc[6].sent_start = True
 | 
						|
    deser_doc = Doc(vocab).from_bytes(doc.to_bytes())
 | 
						|
    assert deser_doc[6].sent_start
 | 
						|
    assert not deser_doc.is_parsed
 | 
						|
    assert not deser_doc.is_tagged
 | 
						|
    doc.is_parsed = True
 | 
						|
    doc.is_tagged = True
 | 
						|
    deser_doc = Doc(vocab).from_bytes(doc.to_bytes())
 | 
						|
    assert deser_doc.is_parsed
 | 
						|
    assert deser_doc.is_tagged
 | 
						|
 | 
						|
 | 
						|
 | 
						|
 |