mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-14 05:37:03 +03:00
Update default pretraining config [ci skip]
This commit is contained in:
parent
154752f9c2
commit
e977086a9a
|
@ -1,13 +1,23 @@
|
||||||
[pretraining]
|
[pretraining]
|
||||||
max_epochs = 1000
|
max_epochs = 1000
|
||||||
min_length = 5
|
|
||||||
max_length = 500
|
|
||||||
dropout = 0.2
|
dropout = 0.2
|
||||||
n_save_every = null
|
n_save_every = null
|
||||||
batch_size = 3000
|
component = "tok2vec"
|
||||||
seed = ${system.seed}
|
layer = ""
|
||||||
use_pytorch_for_gpu_memory = ${system.use_pytorch_for_gpu_memory}
|
|
||||||
tok2vec_model = "components.tok2vec.model"
|
[pretraining.batcher]
|
||||||
|
@batchers = "spacy.batch_by_words.v1"
|
||||||
|
size = 3000
|
||||||
|
discard_oversize = false
|
||||||
|
tolerance = 0.2
|
||||||
|
get_length = null
|
||||||
|
|
||||||
|
[pretraining.corpus]
|
||||||
|
@readers = "spacy.JsonlReader.v1"
|
||||||
|
path = ${paths.raw}
|
||||||
|
min_length = 5
|
||||||
|
max_length = 500
|
||||||
|
limit = 0
|
||||||
|
|
||||||
[pretraining.objective]
|
[pretraining.objective]
|
||||||
type = "characters"
|
type = "characters"
|
||||||
|
|
Loading…
Reference in New Issue
Block a user