Tweak memory management in train_from_config

Matthew Honnibal 2020-05-21 19:32:04 +02:00
parent f075655deb
commit 3b5cfec1fc


@@ -213,6 +213,12 @@ def train_from_config(
                if is_best_checkpoint and output_path is not None:
                    nlp.to_disk(output_path)
                progress = tqdm.tqdm(total=training["eval_frequency"], leave=False)
            # Clean up the objects to facilitate garbage collection.
            for eg in batch:
                eg.doc = None
                eg.goldparse = None
                eg.doc_annotation = None
                eg.token_annotation = None
    finally:
        if output_path is not None:
            final_model_path = output_path / "model-final"
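
For readers unfamiliar with the pattern, here is a minimal, self-contained sketch of what this tweak does: once a batch has been consumed by a training step, the heavyweight per-example references are dropped so the garbage collector can reclaim them before the next batch is materialized. The Example dataclass, train_step, and train_loop below are hypothetical stand-ins for illustration, not spaCy's actual classes or API.

from dataclasses import dataclass
from typing import Any, List, Optional


@dataclass
class Example:
    # Hypothetical stand-in for a training example that holds references
    # to large document/annotation objects.
    doc: Optional[Any] = None
    goldparse: Optional[Any] = None
    doc_annotation: Optional[Any] = None
    token_annotation: Optional[Any] = None


def train_step(batch: List[Example]) -> None:
    # Hypothetical: compute the loss and update weights from the batch.
    ...


def train_loop(batches: List[List[Example]]) -> None:
    for batch in batches:
        train_step(batch)
        # Drop the heavyweight references eagerly, mirroring the diff above.
        # Even if the Example shells are still held elsewhere (e.g. by a
        # corpus cache), the objects they pointed to become unreachable
        # and can be collected.
        for eg in batch:
            eg.doc = None
            eg.goldparse = None
            eg.doc_annotation = None
            eg.token_annotation = None

Clearing the attributes, rather than just letting the batch variable go out of scope, matters when the example objects themselves outlive the loop iteration: the shells remain alive, but the large parsed documents and annotations they referenced can be freed between batches, keeping peak memory flat over a long training run.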