Update Scorer and add API docs

This commit is contained in:
Ines Montani 2019-05-24 14:06:04 +02:00
parent 4d550a3055
commit b78a8dc1d2
3 changed files with 98 additions and 6 deletions

View File

@ -35,7 +35,17 @@ class PRFScore(object):
class Scorer(object): class Scorer(object):
"""Compute evaluation scores."""
def __init__(self, eval_punct=False): def __init__(self, eval_punct=False):
"""Initialize the Scorer.
eval_punct (bool): Evaluate the dependency attachments to and from
punctuation.
RETURNS (Scorer): The newly created object.
DOCS: https://spacy.io/api/scorer#init
"""
self.tokens = PRFScore() self.tokens = PRFScore()
self.sbd = PRFScore() self.sbd = PRFScore()
self.unlabelled = PRFScore() self.unlabelled = PRFScore()
@ -46,34 +56,46 @@ class Scorer(object):
@property @property
def tags_acc(self): def tags_acc(self):
"""RETURNS (float): Part-of-speech tag accuracy (fine grained tags,
i.e. `Token.tag`).
"""
return self.tags.fscore * 100 return self.tags.fscore * 100
@property @property
def token_acc(self): def token_acc(self):
"""RETURNS (float): Tokenization accuracy."""
return self.tokens.precision * 100 return self.tokens.precision * 100
@property @property
def uas(self): def uas(self):
"""RETURNS (float): Unlabelled dependency score."""
return self.unlabelled.fscore * 100 return self.unlabelled.fscore * 100
@property @property
def las(self): def las(self):
"""RETURNS (float): Labelled depdendency score."""
return self.labelled.fscore * 100 return self.labelled.fscore * 100
@property @property
def ents_p(self): def ents_p(self):
"""RETURNS (float): Named entity accuracy (precision)."""
return self.ner.precision * 100 return self.ner.precision * 100
@property @property
def ents_r(self): def ents_r(self):
"""RETURNS (float): Named entity accuracy (recall)."""
return self.ner.recall * 100 return self.ner.recall * 100
@property @property
def ents_f(self): def ents_f(self):
"""RETURNS (float): Named entity accuracy (F-score)."""
return self.ner.fscore * 100 return self.ner.fscore * 100
@property @property
def scores(self): def scores(self):
"""RETURNS (dict): All scores with keys `uas`, `las`, `ents_p`,
`ents_r`, `ents_f`, `tags_acc` and `token_acc`.
"""
return { return {
"uas": self.uas, "uas": self.uas,
"las": self.las, "las": self.las,
@ -84,9 +106,20 @@ class Scorer(object):
"token_acc": self.token_acc, "token_acc": self.token_acc,
} }
def score(self, tokens, gold, verbose=False, punct_labels=("p", "punct")): def score(self, doc, gold, verbose=False, punct_labels=("p", "punct")):
if len(tokens) != len(gold): """Update the evaluation scores from a single Doc / GoldParse pair.
gold = GoldParse.from_annot_tuples(tokens, zip(*gold.orig_annot))
doc (Doc): The predicted annotations.
gold (GoldParse): The correct annotations.
verbose (bool): Print debugging information.
punct_labels (tuple): Dependency labels for punctuation. Used to
evaluate dependency attachments to punctuation if `eval_punct` is
`True`.
DOCS: https://spacy.io/api/scorer#score
"""
if len(doc) != len(gold):
gold = GoldParse.from_annot_tuples(doc, zip(*gold.orig_annot))
gold_deps = set() gold_deps = set()
gold_tags = set() gold_tags = set()
gold_ents = set(tags_to_entities([annot[-1] for annot in gold.orig_annot])) gold_ents = set(tags_to_entities([annot[-1] for annot in gold.orig_annot]))
@ -96,7 +129,7 @@ class Scorer(object):
gold_deps.add((id_, head, dep.lower())) gold_deps.add((id_, head, dep.lower()))
cand_deps = set() cand_deps = set()
cand_tags = set() cand_tags = set()
for token in tokens: for token in doc:
if token.orth_.isspace(): if token.orth_.isspace():
continue continue
gold_i = gold.cand_to_gold[token.i] gold_i = gold.cand_to_gold[token.i]
@ -116,7 +149,7 @@ class Scorer(object):
cand_deps.add((gold_i, gold_head, token.dep_.lower())) cand_deps.add((gold_i, gold_head, token.dep_.lower()))
if "-" not in [token[-1] for token in gold.orig_annot]: if "-" not in [token[-1] for token in gold.orig_annot]:
cand_ents = set() cand_ents = set()
for ent in tokens.ents: for ent in doc.ents:
first = gold.cand_to_gold[ent.start] first = gold.cand_to_gold[ent.start]
last = gold.cand_to_gold[ent.end - 1] last = gold.cand_to_gold[ent.end - 1]
if first is None or last is None: if first is None or last is None:

View File

@ -0,0 +1,58 @@
---
title: Scorer
teaser: Compute evaluation scores
tag: class
source: spacy/scorer.py
---
The `Scorer` computes and stores evaluation scores. It's typically created by
[`Language.evaluate`](/api/language#evaluate).
## Scorer.\_\_init\_\_ {#init tag="method"}
Create a new `Scorer`.
> #### Example
>
> ```python
> from spacy.scorer import Scorer
>
> scorer = Scorer()
> ```
| Name | Type | Description |
| ------------ | -------- | ------------------------------------------------------------ |
| `eval_punct` | bool | Evaluate the dependency attachments to and from punctuation. |
| **RETURNS** | `Scorer` | The newly created object. |
## Scorer.score {#score tag="method"}
Update the evaluation scores from a single [`Doc`](/api/doc) /
[`GoldParse`](/api/goldparse) pair.
> #### Example
>
> ```python
> scorer = Scorer()
> scorer.score(doc, gold)
> ```
| Name | Type | Description |
| -------------- | ----------- | -------------------------------------------------------------------------------------------------------------------- |
| `doc` | `Doc` | The predicted annotations. |
| `gold` | `GoldParse` | The correct annotations. |
| `verbose` | bool | Print debugging information. |
| `punct_labels` | tuple | Dependency labels for punctuation. Used to evaluate dependency attachments to punctuation if `eval_punct` is `True`. |
## Properties
| Name | Type | Description |
| ----------- | ----- | -------------------------------------------------------------------------------------------- |
| `token_acc` | float | Tokenization accuracy. |
| `tags_acc` | float | Part-of-speech tag accuracy (fine grained tags, i.e. `Token.tag`). |
| `uas` | float | Unlabelled dependency score. |
| `las` | float | Labelled dependency score. |
| `ents_p` | float | Named entity accuracy (precision). |
| `ents_r` | float | Named entity accuracy (recall). |
| `ents_f` | float | Named entity accuracy (F-score). |
| `scores` | dict | All scores with keys `uas`, `las`, `ents_p`, `ents_r`, `ents_f`, `tags_acc` and `token_acc`. |

View File

@ -90,7 +90,8 @@
{ "text": "StringStore", "url": "/api/stringstore" }, { "text": "StringStore", "url": "/api/stringstore" },
{ "text": "Vectors", "url": "/api/vectors" }, { "text": "Vectors", "url": "/api/vectors" },
{ "text": "GoldParse", "url": "/api/goldparse" }, { "text": "GoldParse", "url": "/api/goldparse" },
{ "text": "GoldCorpus", "url": "/api/goldcorpus" } { "text": "GoldCorpus", "url": "/api/goldcorpus" },
{ "text": "Scorer", "url": "/api/scorer" }
] ]
}, },
{ {