update EL training data format in docs (#7839)

* update EL training data format

* fix typo

* all -1 because reasons
This commit is contained in:
Sofie Van Landeghem 2021-04-22 08:50:09 +02:00 committed by GitHub
parent 49ff1126bf
commit 2e746dbf32
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -451,9 +451,11 @@ doc = nlp("I'm pretty happy about that!")
gold_dict = {"cats": {"POSITIVE": 1.0, "NEGATIVE": 0.0}}
example = Example.from_dict(doc, gold_dict)
# Training data for an Entity Linking component
# Training data for an Entity Linking component (also requires entities & sentences)
doc = nlp("Russ Cochran his reprints include EC Comics.")
gold_dict = {"links": {(0, 12): {"Q7381115": 1.0, "Q2146908": 0.0}}}
gold_dict = {"entities": [(0, 12, "PERSON")],
"links": {(0, 12): {"Q7381115": 1.0, "Q2146908": 0.0}},
"sent_starts": [1, -1, -1, -1, -1, -1, -1, -1]}
example = Example.from_dict(doc, gold_dict)
```