mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-13 02:36:32 +03:00
Slightly modify test for #3468
Check for Token.is_sent_start first (which is serialized/deserialized correctly)
This commit is contained in:
parent
02d9378d8c
commit
fbec72b4c3
|
@@ -13,11 +13,11 @@ def test_issue3468():
|
||||||
nlp = English()
|
nlp = English()
|
||||||
nlp.add_pipe(nlp.create_pipe("sentencizer"))
|
nlp.add_pipe(nlp.create_pipe("sentencizer"))
|
||||||
doc = nlp("Hello world")
|
doc = nlp("Hello world")
|
||||||
assert doc.is_sentenced
|
|
||||||
assert doc[0].is_sent_start
|
assert doc[0].is_sent_start
|
||||||
|
assert doc.is_sentenced
|
||||||
assert len(list(doc.sents)) == 1
|
assert len(list(doc.sents)) == 1
|
||||||
doc_bytes = doc.to_bytes()
|
doc_bytes = doc.to_bytes()
|
||||||
new_doc = Doc(nlp.vocab).from_bytes(doc_bytes)
|
new_doc = Doc(nlp.vocab).from_bytes(doc_bytes)
|
||||||
assert new_doc.is_sentenced
|
|
||||||
assert doc[0].is_sent_start
|
assert doc[0].is_sent_start
|
||||||
|
assert new_doc.is_sentenced
|
||||||
assert len(list(new_doc.sents)) == 1
|
assert len(list(new_doc.sents)) == 1
|
||||||
|
|
Loading…
Reference in New Issue
Block a user