mirror of
https://github.com/explosion/spaCy.git
synced 2025-02-10 08:30:34 +03:00
Add BILUO docs to NER annotation scheme
This commit is contained in:
parent
fdd8dacb75
commit
91dbee1b8f
|
@ -86,6 +86,31 @@ include _annotation/_dep-labels
|
||||||
|
|
||||||
include _annotation/_named-entities
|
include _annotation/_named-entities
|
||||||
|
|
||||||
|
| Ratinov and Roth (2009) showed that the minimal #[strong Begin], #[strong In], #[strong Out]
|
||||||
|
| scheme was more difficult to learn than the #[strong BILUO] scheme that
|
||||||
|
| we use, which explicitly marks boundary tokens.
|
||||||
|
|
||||||
|
+table(["Tag", "Description"])
|
||||||
|
+row
|
||||||
|
+cell #[code #[span.u-color-theme B] EGIN]
|
||||||
|
+cell The first token of a multi-token entity.
|
||||||
|
|
||||||
|
+row
|
||||||
|
+cell #[code #[span.u-color-theme I] N]
|
||||||
|
+cell An inner token of a multi-token entity.
|
||||||
|
|
||||||
|
+row
|
||||||
|
+cell #[code #[span.u-color-theme L] AST]
|
||||||
|
+cell The final token of a multi-token entity.
|
||||||
|
|
||||||
|
+row
|
||||||
|
+cell #[code #[span.u-color-theme U] NIT]
|
||||||
|
+cell A single-token entity.
|
||||||
|
|
||||||
|
+row
|
||||||
|
+cell #[code #[span.u-color-theme O] UT]
|
||||||
|
+cell A non-entity token.
|
||||||
|
|
||||||
+h(2, "json-input") JSON input format for training
|
+h(2, "json-input") JSON input format for training
|
||||||
|
|
||||||
p
|
p
|
||||||
|
|
Loading…
Reference in New Issue
Block a user