Fix test for misaligned tokenization

2025-11-15 23:36:03 +03:00 · 2020-06-15 23:10:47 +02:00 · 2020-06-15 23:10:47 +02:00 · 0702a1d3fb
commit 0702a1d3fb
parent a28f8f369e
1 changed file with 4 additions and 4 deletions
--- a/spacy/tests/test_gold.py
+++ b/spacy/tests/test_gold.py
@@ -176,10 +176,10 @@ def test_gold_biluo_different_tokenization(en_vocab, en_tokenizer):
    spaces = [True, True, True, False, False]
    doc = Doc(en_vocab, words=words, spaces=spaces)
    entities = [(len("I flew to "), len("I flew to San Francisco Valley"), "LOC")]
-    gp = GoldParse(
+    gold_words = ["I", "flew to", "San", "Francisco Valley", "."]
-        doc, words=["I", "flew to", "San", "Francisco Valley", "."], entities=entities,
+    example = Example.from_dict(doc, {"words": gold_words, "entities": entities})
-    )
+    assert example.get_aligned("ENT_IOB") == [2, 2, 3, 1, 2]
-    assert gp.ner == ["O", "O", "B-LOC", "L-LOC", "O"]
+    assert example.get_aligned("ENT_TYPE", as_string=True) == ["", "", "LOC", "LOC", ""]
    # additional whitespace tokens in GoldParse words
    words, spaces = get_words_and_spaces(