mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-12 10:16:27 +03:00
Sync missing and misaligned values in Tagger loss (#6689)
Use `None` for both missing and misaligned annotation in `Tagger.get_loss`, reverting to the default missing value in the loss function.
This commit is contained in:
parent
c04bab6bae
commit
ad43cbb042
|
@ -256,8 +256,14 @@ class Tagger(TrainablePipe):
|
||||||
DOCS: https://nightly.spacy.io/api/tagger#get_loss
|
DOCS: https://nightly.spacy.io/api/tagger#get_loss
|
||||||
"""
|
"""
|
||||||
validate_examples(examples, "Tagger.get_loss")
|
validate_examples(examples, "Tagger.get_loss")
|
||||||
loss_func = SequenceCategoricalCrossentropy(names=self.labels, normalize=False, missing_value="")
|
loss_func = SequenceCategoricalCrossentropy(names=self.labels, normalize=False)
|
||||||
truths = [eg.get_aligned("TAG", as_string=True) for eg in examples]
|
# Convert empty tag "" to missing value None so that both misaligned
|
||||||
|
# tokens and tokens with missing annotation have the default missing
|
||||||
|
# value None.
|
||||||
|
truths = []
|
||||||
|
for eg in examples:
|
||||||
|
eg_truths = [tag if tag is not "" else None for tag in eg.get_aligned("TAG", as_string=True)]
|
||||||
|
truths.append(eg_truths)
|
||||||
d_scores, loss = loss_func(scores, truths)
|
d_scores, loss = loss_func(scores, truths)
|
||||||
if self.model.ops.xp.isnan(loss):
|
if self.model.ops.xp.isnan(loss):
|
||||||
raise ValueError(Errors.E910.format(name=self.name))
|
raise ValueError(Errors.E910.format(name=self.name))
|
||||||
|
|
|
@ -37,7 +37,16 @@ TRAIN_DATA = [
|
||||||
]
|
]
|
||||||
|
|
||||||
PARTIAL_DATA = [
|
PARTIAL_DATA = [
|
||||||
|
# partial annotation
|
||||||
("I like green eggs", {"tags": ["", "V", "J", ""]}),
|
("I like green eggs", {"tags": ["", "V", "J", ""]}),
|
||||||
|
# misaligned partial annotation
|
||||||
|
(
|
||||||
|
"He hates green eggs",
|
||||||
|
{
|
||||||
|
"words": ["He", "hate", "s", "green", "eggs"],
|
||||||
|
"tags": ["", "V", "S", "J", ""],
|
||||||
|
},
|
||||||
|
),
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user