Fix scoring if tokenization changes

2025-07-02 10:53:05 +03:00 · 2018-05-01 01:33:20 +02:00 · 2018-05-01 01:33:20 +02:00 · d44bb45c72
commit d44bb45c72
parent 723b328062
1 changed files with 1 additions and 1 deletions
--- a/spacy/scorer.py
+++ b/spacy/scorer.py
@ -86,7 +86,7 @@ class Scorer(object):
    def score(self, tokens, gold, verbose=False, punct_labels=('p', 'punct')):
        if len(tokens) != len(gold):
-            raise ValueError(Errors.E078.format(words_doc=len(tokens), words_gold=len(gold)))
+            gold = GoldParse.from_annot_tuples(tokens, zip(*gold.orig_annot))
        gold_deps = set()
        gold_tags = set()
        gold_ents = set(tags_to_entities([annot[-1]