diff --git a/spacy/tests/training/test_pretraining.py b/spacy/tests/training/test_pretraining.py
index c0d64f1e7..47aee0796 100644
--- a/spacy/tests/training/test_pretraining.py
+++ b/spacy/tests/training/test_pretraining.py
@@ -164,6 +164,24 @@ def test_pretraining_default():
     assert "PretrainCharacters" in filled["pretraining"]["objective"]["@architectures"]
 
 
+@pytest.mark.parametrize("objective", CHAR_OBJECTIVES)
+def test_pretraining_last_model(objective):
+    """Test that pretraining leaves a model_last.bin file in the output directory."""
+    config = Config().from_str(pretrain_string_listener)
+    config["pretraining"]["objective"] = objective
+    nlp = util.load_model_from_config(config, auto_fill=True, validate=False)
+    filled = nlp.config
+    pretrain_config = util.load_config(DEFAULT_CONFIG_PRETRAIN_PATH)
+    filled = pretrain_config.merge(filled)
+    with make_tempdir() as tmp_dir:
+        file_path = write_sample_jsonl(tmp_dir)
+        filled["paths"]["raw_text"] = file_path
+        filled = filled.interpolate()
+        assert filled["pretraining"]["component"] == "tok2vec"
+        pretrain(filled, tmp_dir)
+        assert Path(tmp_dir / "model_last.bin").exists()
+
+
 @pytest.mark.parametrize("objective", CHAR_OBJECTIVES)
 def test_pretraining_tok2vec_characters(objective):
     """Test that pretraining works with the character objective"""