Reduce batch size during pretrain

2025-09-22 20:16:43 +03:00 · 2018-12-10 15:30:23 +00:00 · 2018-12-10 15:30:23 +00:00 · df15279e88
commit df15279e88
parent 83ac227bd3
1 changed file with 1 addition and 1 deletion
--- a/spacy/cli/pretrain.py
+++ b/spacy/cli/pretrain.py
@@ -110,7 +110,7 @@ def pretrain(
    msg.row(("#", "# Words", "Total Loss", "Loss", "w/s"), **row_settings)
    for epoch in range(nr_iter):
        for batch in util.minibatch_by_words(
-            ((text, None) for text in texts), size=5000
+            ((text, None) for text in texts), size=3000
        ):
            docs = make_docs(nlp, [text for (text, _) in batch])
            loss = make_update(model, docs, optimizer, drop=dropout)