mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-14 05:37:03 +03:00
28 lines
715 B
Python
28 lines
715 B
Python
|
from __future__ import unicode_literals
|
||
|
from ...tokens import Doc
|
||
|
from ...vocab import Vocab
|
||
|
|
||
|
|
||
|
def test_issue1834():
    """Check that serialization keeps sentence boundaries and flags.

    A sentence start is set by hand on one token, then the doc is sent
    through a ``to_bytes`` / ``from_bytes`` round trip twice: once with
    the ``is_parsed`` / ``is_tagged`` flags untouched, and once after
    both have been set to True.
    """
    tokens = "This is a first sentence . And another one".split()
    original = Doc(Vocab(), words=tokens)
    # Reuse the vocab of the source doc for every deserialized copy.
    shared_vocab = original.vocab
    # Token 6 is "And", the first word after the full stop.
    original[6].sent_start = True

    # First round trip: the boundary is kept, the flags stay falsy.
    restored = Doc(shared_vocab).from_bytes(original.to_bytes())
    assert restored[6].sent_start
    assert not restored.is_parsed
    assert not restored.is_tagged

    # Second round trip: both flags are switched on before serializing.
    original.is_parsed = True
    original.is_tagged = True
    restored = Doc(shared_vocab).from_bytes(original.to_bytes())
    assert restored.is_parsed
    assert restored.is_tagged
|
||
|
|
||
|
|
||
|
|
||
|
|