mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-12 02:06:31 +03:00
Add documentation for spaCy's JSON format
This commit is contained in:
parent
007a2492bd
commit
13df2d6a60
|
@@ -79,3 +79,33 @@ p
|
||||||
+h(2, "named-entities") Named Entity Recognition
|
+h(2, "named-entities") Named Entity Recognition
|
||||||
|
|
||||||
include _annotation/_named-entities
|
include _annotation/_named-entities
|
||||||
|
|
||||||
|
+h(2, "json-input") JSON input format for training
|
||||||
|
|
||||||
|
p
|
||||||
|
| spaCy takes training data in the following format:
|
||||||
|
|
||||||
|
+code("Example structure").
|
||||||
|
doc: {
|
||||||
|
id: string,
|
||||||
|
paragraphs: [{
|
||||||
|
raw: string,
|
||||||
|
sents: [int],
|
||||||
|
tokens: [{
|
||||||
|
start: int,
|
||||||
|
tag: string,
|
||||||
|
head: int,
|
||||||
|
dep: string
|
||||||
|
}],
|
||||||
|
ner: [{
|
||||||
|
start: int,
|
||||||
|
end: int,
|
||||||
|
label: string
|
||||||
|
}],
|
||||||
|
brackets: [{
|
||||||
|
start: int,
|
||||||
|
end: int,
|
||||||
|
label: string
|
||||||
|
}]
|
||||||
|
}]
|
||||||
|
}
|
||||||
|
|
|
@@ -143,7 +143,8 @@ p
|
||||||
+tag experimental
|
+tag experimental
|
||||||
|
|
||||||
p
|
p
|
||||||
| Train a model. Expects data in spaCy's JSON format.
|
| Train a model. Expects data in spaCy's
|
||||||
|
| #[+a("/docs/api/annotation#json-input") JSON format].
|
||||||
|
|
||||||
+code(false, "bash").
|
+code(false, "bash").
|
||||||
python -m spacy train [lang] [output_dir] [train_data] [dev_data] [--n_iter] [--parser_L1] [--no_tagger] [--no_parser] [--no_ner]
|
python -m spacy train [lang] [output_dir] [train_data] [dev_data] [--n_iter] [--parser_L1] [--no_tagger] [--no_parser] [--no_ner]
|
||||||
|
|
Loading…
Reference in New Issue
Block a user