From bef9f63e1391d89d9e246855e9f769b3172a2c18 Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 21 Sep 2023 11:28:58 +0200
Subject: [PATCH 01/25] Add gpt-3.5-turbo-instruct to list of supported OpenAI
 models.

---
 website/docs/api/large-language-models.mdx | 68 +++++++++++-----------
 1 file changed, 34 insertions(+), 34 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index d32368e22..43a95074a 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -19,8 +19,8 @@ prototyping** and **prompting**, and turning unstructured responses into
 An LLM component is implemented through the `LLMWrapper` class. It is accessible
 through a generic `llm`
 [component factory](https://spacy.io/usage/processing-pipelines#custom-components-factories)
-as well as through task-specific component factories: `llm_ner`, `llm_spancat`, `llm_rel`,
-`llm_textcat`, `llm_sentiment` and `llm_summarization`.
+as well as through task-specific component factories: `llm_ner`, `llm_spancat`,
+`llm_rel`, `llm_textcat`, `llm_sentiment` and `llm_summarization`.
 
 ### LLMWrapper.\_\_init\_\_ {id="init",tag="method"}
 
@@ -952,38 +952,38 @@ provider's API.
 
 Currently, these models are provided as part of the core library:
 
-| Model                         | Provider  | Supported names                                                                          | Default name           | Default config                       |
-| ----------------------------- | --------- | ---------------------------------------------------------------------------------------- | ---------------------- | ------------------------------------ |
-| `spacy.GPT-4.v1`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                 | `"gpt-4"`              | `{}`                                 |
-| `spacy.GPT-4.v2`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                 | `"gpt-4"`              | `{temperature=0.0}`                  |
-| `spacy.GPT-3-5.v1`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k"]` | `"gpt-3.5-turbo"`      | `{}`                                 |
-| `spacy.GPT-3-5.v2`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k"]` | `"gpt-3.5-turbo"`      | `{temperature=0.0}`                  |
-| `spacy.Davinci.v1`            | OpenAI    | `["davinci"]`                                                                            | `"davinci"`            | `{}`                                 |
-| `spacy.Davinci.v2`            | OpenAI    | `["davinci"]`                                                                            | `"davinci"`            | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Davinci.v1`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                               | `"text-davinci-003"`   | `{}`                                 |
-| `spacy.Text-Davinci.v2`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                               | `"text-davinci-003"`   | `{temperature=0.0, max_tokens=1000}` |
-| `spacy.Code-Davinci.v1`       | OpenAI    | `["code-davinci-002"]`                                                                   | `"code-davinci-002"`   | `{}`                                 |
-| `spacy.Code-Davinci.v2`       | OpenAI    | `["code-davinci-002"]`                                                                   | `"code-davinci-002"`   | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Curie.v1`              | OpenAI    | `["curie"]`                                                                              | `"curie"`              | `{}`                                 |
-| `spacy.Curie.v2`              | OpenAI    | `["curie"]`                                                                              | `"curie"`              | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Curie.v1`         | OpenAI    | `["text-curie-001"]`                                                                     | `"text-curie-001"`     | `{}`                                 |
-| `spacy.Text-Curie.v2`         | OpenAI    | `["text-curie-001"]`                                                                     | `"text-curie-001"`     | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Babbage.v1`            | OpenAI    | `["babbage"]`                                                                            | `"babbage"`            | `{}`                                 |
-| `spacy.Babbage.v2`            | OpenAI    | `["babbage"]`                                                                            | `"babbage"`            | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Babbage.v1`       | OpenAI    | `["text-babbage-001"]`                                                                   | `"text-babbage-001"`   | `{}`                                 |
-| `spacy.Text-Babbage.v2`       | OpenAI    | `["text-babbage-001"]`                                                                   | `"text-babbage-001"`   | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Ada.v1`                | OpenAI    | `["ada"]`                                                                                | `"ada"`                | `{}`                                 |
-| `spacy.Ada.v2`                | OpenAI    | `["ada"]`                                                                                | `"ada"`                | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Ada.v1`           | OpenAI    | `["text-ada-001"]`                                                                       | `"text-ada-001"`       | `{}`                                 |
-| `spacy.Text-Ada.v2`           | OpenAI    | `["text-ada-001"]`                                                                       | `"text-ada-001"`       | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Command.v1`            | Cohere    | `["command", "command-light", "command-light-nightly", "command-nightly"]`               | `"command"`            | `{}`                                 |
-| `spacy.Claude-2.v1`           | Anthropic | `["claude-2", "claude-2-100k"]`                                                          | `"claude-2"`           | `{}`                                 |
-| `spacy.Claude-1.v1`           | Anthropic | `["claude-1", "claude-1-100k"]`                                                          | `"claude-1"`           | `{}`                                 |
-| `spacy.Claude-1-0.v1`         | Anthropic | `["claude-1.0"]`                                                                         | `"claude-1.0"`         | `{}`                                 |
-| `spacy.Claude-1-2.v1`         | Anthropic | `["claude-1.2"]`                                                                         | `"claude-1.2"`         | `{}`                                 |
-| `spacy.Claude-1-3.v1`         | Anthropic | `["claude-1.3", "claude-1.3-100k"]`                                                      | `"claude-1.3"`         | `{}`                                 |
-| `spacy.Claude-instant-1.v1`   | Anthropic | `["claude-instant-1", "claude-instant-1-100k"]`                                          | `"claude-instant-1"`   | `{}`                                 |
-| `spacy.Claude-instant-1-1.v1` | Anthropic | `["claude-instant-1.1", "claude-instant-1.1-100k"]`                                      | `"claude-instant-1.1"` | `{}`                                 |
+| Model                         | Provider  | Supported names                                                                                                    | Default name           | Default config                       |
+| ----------------------------- | --------- | ------------------------------------------------------------------------------------------------------------------ | ---------------------- | ------------------------------------ |
+| `spacy.GPT-4.v1`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{}`                                 |
+| `spacy.GPT-4.v2`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{temperature=0.0}`                  |
+| `spacy.GPT-3-5.v1`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{}`                                 |
+| `spacy.GPT-3-5.v2`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{temperature=0.0}`                  |
+| `spacy.Davinci.v1`            | OpenAI    | `["davinci"]`                                                                                                      | `"davinci"`            | `{}`                                 |
+| `spacy.Davinci.v2`            | OpenAI    | `["davinci"]`                                                                                                      | `"davinci"`            | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Davinci.v1`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{}`                                 |
+| `spacy.Text-Davinci.v2`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{temperature=0.0, max_tokens=1000}` |
+| `spacy.Code-Davinci.v1`       | OpenAI    | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{}`                                 |
+| `spacy.Code-Davinci.v2`       | OpenAI    | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Curie.v1`              | OpenAI    | `["curie"]`                                                                                                        | `"curie"`              | `{}`                                 |
+| `spacy.Curie.v2`              | OpenAI    | `["curie"]`                                                                                                        | `"curie"`              | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Curie.v1`         | OpenAI    | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{}`                                 |
+| `spacy.Text-Curie.v2`         | OpenAI    | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Babbage.v1`            | OpenAI    | `["babbage"]`                                                                                                      | `"babbage"`            | `{}`                                 |
+| `spacy.Babbage.v2`            | OpenAI    | `["babbage"]`                                                                                                      | `"babbage"`            | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Babbage.v1`       | OpenAI    | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{}`                                 |
+| `spacy.Text-Babbage.v2`       | OpenAI    | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Ada.v1`                | OpenAI    | `["ada"]`                                                                                                          | `"ada"`                | `{}`                                 |
+| `spacy.Ada.v2`                | OpenAI    | `["ada"]`                                                                                                          | `"ada"`                | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Ada.v1`           | OpenAI    | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{}`                                 |
+| `spacy.Text-Ada.v2`           | OpenAI    | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Command.v1`            | Cohere    | `["command", "command-light", "command-light-nightly", "command-nightly"]`                                         | `"command"`            | `{}`                                 |
+| `spacy.Claude-2.v1`           | Anthropic | `["claude-2", "claude-2-100k"]`                                                                                    | `"claude-2"`           | `{}`                                 |
+| `spacy.Claude-1.v1`           | Anthropic | `["claude-1", "claude-1-100k"]`                                                                                    | `"claude-1"`           | `{}`                                 |
+| `spacy.Claude-1-0.v1`         | Anthropic | `["claude-1.0"]`                                                                                                   | `"claude-1.0"`         | `{}`                                 |
+| `spacy.Claude-1-2.v1`         | Anthropic | `["claude-1.2"]`                                                                                                   | `"claude-1.2"`         | `{}`                                 |
+| `spacy.Claude-1-3.v1`         | Anthropic | `["claude-1.3", "claude-1.3-100k"]`                                                                                | `"claude-1.3"`         | `{}`                                 |
+| `spacy.Claude-instant-1.v1`   | Anthropic | `["claude-instant-1", "claude-instant-1-100k"]`                                                                    | `"claude-instant-1"`   | `{}`                                 |
+| `spacy.Claude-instant-1-1.v1` | Anthropic | `["claude-instant-1.1", "claude-instant-1.1-100k"]`                                                                | `"claude-instant-1.1"` | `{}`                                 |
 
 To use these models, make sure that you've [set the relevant API](#api-keys)
 keys as environment variables.

From 1b043dde3fc674869f11b8b138db878552b4c91a Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Wed, 9 Aug 2023 13:43:50 +0200
Subject: [PATCH 02/25] Revert "disable tests until 3.7 models are available"

This reverts commit 991bcc111e1a35cc96dba32ac08c212b0b360384.
---
 .github/workflows/tests.yml | 54 ++++++++++++++++++-------------------
 spacy/tests/test_cli.py     |  2 --
 2 files changed, 27 insertions(+), 29 deletions(-)

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index 1058b4673..976b1f4f2 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -115,22 +115,22 @@ jobs:
       - name: Test import
         run: python -W error -c "import spacy"
 
-#      - name: "Test download CLI"
-#        run: |
-#          python -m spacy download ca_core_news_sm
-#          python -m spacy download ca_core_news_md
-#          python -c "import spacy; nlp=spacy.load('ca_core_news_sm'); doc=nlp('test')"
-#        if: matrix.python_version == '3.9'
-#
-#      - name: "Test download_url in info CLI"
-#        run: |
-#          python -W error -m spacy info ca_core_news_sm | grep -q download_url
-#        if: matrix.python_version == '3.9'
-#
-#      - name: "Test no warnings on load (#11713)"
-#        run: |
-#          python -W error -c "import ca_core_news_sm; nlp = ca_core_news_sm.load(); doc=nlp('test')"
-#        if: matrix.python_version == '3.9'
+      - name: "Test download CLI"
+        run: |
+          python -m spacy download ca_core_news_sm
+          python -m spacy download ca_core_news_md
+          python -c "import spacy; nlp=spacy.load('ca_core_news_sm'); doc=nlp('test')"
+        if: matrix.python_version == '3.9'
+
+      - name: "Test download_url in info CLI"
+        run: |
+          python -W error -m spacy info ca_core_news_sm | grep -q download_url
+        if: matrix.python_version == '3.9'
+
+      - name: "Test no warnings on load (#11713)"
+        run: |
+          python -W error -c "import ca_core_news_sm; nlp = ca_core_news_sm.load(); doc=nlp('test')"
+        if: matrix.python_version == '3.9'
 
       - name: "Test convert CLI"
         run: |
@@ -154,17 +154,17 @@ jobs:
           python -m spacy train ner.cfg --paths.train ner-token-per-line-conll2003.spacy --paths.dev ner-token-per-line-conll2003.spacy --training.max_steps 10 --gpu-id -1
         if: matrix.python_version == '3.9'
 
-#      - name: "Test assemble CLI"
-#        run: |
-#          python -c "import spacy; config = spacy.util.load_config('ner.cfg'); config['components']['ner'] = {'source': 'ca_core_news_sm'}; config.to_disk('ner_source_sm.cfg')"
-#          PYTHONWARNINGS="error,ignore::DeprecationWarning" python -m spacy assemble ner_source_sm.cfg output_dir
-#        if: matrix.python_version == '3.9'
-#
-#      - name: "Test assemble CLI vectors warning"
-#        run: |
-#          python -c "import spacy; config = spacy.util.load_config('ner.cfg'); config['components']['ner'] = {'source': 'ca_core_news_md'}; config.to_disk('ner_source_md.cfg')"
-#          python -m spacy assemble ner_source_md.cfg output_dir 2>&1 | grep -q W113
-#        if: matrix.python_version == '3.9'
+      - name: "Test assemble CLI"
+        run: |
+          python -c "import spacy; config = spacy.util.load_config('ner.cfg'); config['components']['ner'] = {'source': 'ca_core_news_sm'}; config.to_disk('ner_source_sm.cfg')"
+          PYTHONWARNINGS="error,ignore::DeprecationWarning" python -m spacy assemble ner_source_sm.cfg output_dir
+        if: matrix.python_version == '3.9'
+
+      - name: "Test assemble CLI vectors warning"
+        run: |
+          python -c "import spacy; config = spacy.util.load_config('ner.cfg'); config['components']['ner'] = {'source': 'ca_core_news_md'}; config.to_disk('ner_source_md.cfg')"
+          python -m spacy assemble ner_source_md.cfg output_dir 2>&1 | grep -q W113
+        if: matrix.python_version == '3.9'
 
       - name: "Install test requirements"
         run: |
diff --git a/spacy/tests/test_cli.py b/spacy/tests/test_cli.py
index 8c1d1a64c..0d2fe0a9e 100644
--- a/spacy/tests/test_cli.py
+++ b/spacy/tests/test_cli.py
@@ -538,7 +538,6 @@ def test_string_to_list_intify(value):
     assert string_to_list(value, intify=True) == [1, 2, 3]
 
 
-@pytest.mark.skip(reason="Temporarily skip before 3.7 models are published")
 def test_download_compatibility():
     spec = SpecifierSet("==" + about.__version__)
     spec.prereleases = False
@@ -549,7 +548,6 @@ def test_download_compatibility():
         assert get_minor_version(about.__version__) == get_minor_version(version)
 
 
-@pytest.mark.skip(reason="Temporarily skip before 3.7 models are published")
 def test_validate_compatibility_table():
     spec = SpecifierSet("==" + about.__version__)
     spec.prereleases = False

From 160e61772e3e4fbd4e9e28446c6d687596921f93 Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Sun, 1 Oct 2023 21:40:07 +0200
Subject: [PATCH 03/25] Docs for v3.7.0 (#13029)

* Docs for v3.7.0

* Minor fixes

* Extend Weasel notes

* Minor edits

* Update version in README
---
 README.md                      |   2 +-
 website/docs/usage/v3-7.mdx    | 140 +++++++++++++++++++++++++++++++++
 website/meta/sidebars.json     |   3 +-
 website/src/templates/index.js |   4 +-
 4 files changed, 145 insertions(+), 4 deletions(-)
 create mode 100644 website/docs/usage/v3-7.mdx

diff --git a/README.md b/README.md
index 3920c1dc2..b2ffa4639 100644
--- a/README.md
+++ b/README.md
@@ -16,7 +16,7 @@ model packaging, deployment and workflow management. spaCy is commercial
 open-source software, released under the
 [MIT license](https://github.com/explosion/spaCy/blob/master/LICENSE).
 
-💫 **Version 3.6 out now!**
+💫 **Version 3.7 out now!**
 [Check out the release notes here.](https://github.com/explosion/spaCy/releases)
 
 [![tests](https://github.com/explosion/spaCy/actions/workflows/tests.yml/badge.svg)](https://github.com/explosion/spaCy/actions/workflows/tests.yml)
diff --git a/website/docs/usage/v3-7.mdx b/website/docs/usage/v3-7.mdx
new file mode 100644
index 000000000..76fc9530f
--- /dev/null
+++ b/website/docs/usage/v3-7.mdx
@@ -0,0 +1,140 @@
+---
+title: What's New in v3.7
+teaser: New features and how to upgrade
+menu:
+  - ['New Features', 'features']
+  - ['Upgrading Notes', 'upgrading']
+---
+
+## New features {id="features",hidden="true"}
+
+spaCy v3.7 adds support for Python 3.12, introduces the new standalone library
+[Weasel](https://github.com/explosion/weasel) for project workflows, and updates
+the transformer-based trained pipelines to use our new
+[Curated Transformers](https://github.com/explosion/curated-transformers)
+library.
+
+This release drops support for Python 3.6.
+
+### Weasel {id="weasel"}
+
+The [spaCy projects](/usage/projects) functionality has been moved into a new
+standalone library [Weasel](https://github.com/explosion/weasel). This brings
+minor changes to spaCy-specific settings in spaCy projects (see
+[upgrading](#upgrading) below), but also makes it possible to use the same
+workflow functionality outside of spaCy.
+
+All `spacy project` commands should run as before, just now they're using Weasel
+under the hood.
+
+<Infobox title="Remote storage for Python 3.12" variant="warning">
+
+Remote storage for spaCy projects is not yet supported for Python 3.12. Use
+Python 3.11 or earlier for remote storage.
+
+</Infobox>
+
+### Registered vectors {id="custom-vectors"}
+
+You can specify a custom registered vectors class under `[nlp.vectors]` in order
+to use static vectors in formats other than the ones supported by
+[`Vectors`](/api/vectors). To implement your custom vectors, extend the abstract
+class [`BaseVectors`](/api/basevectors). See an example using
+[BPEmb subword embeddings](/usage/embeddings-transformers#custom-vectors).
+
+### Additional features and improvements {id="additional-features-and-improvements"}
+
+- Add support for Python 3.12.
+- Extend to Thinc v8.2.
+- Extend `transformers` extra to `spacy-transformers` v1.3.
+- Add `--spans-key` option for CLI evaluation with `spacy benchmark accuracy`.
+- Load the CLI module lazily for `spacy.info`.
+- Add type stubs for `spacy.training.example`.
+- Warn for unsupported pattern keys in dependency matcher.
+- `Language.replace_listeners`: Pass the replaced listener and the `tok2vec`
+  pipe to the callback in order to support `spacy-curated-transformers`.
+- Always use `tqdm` with `disable=None` in order to disable output in
+  non-interactive environments.
+- Language updates:
+  - Add left and right pointing angle brackets as punctuation to ancient Greek.
+  - Update example sentences for Turkish.
+- Package setup updates:
+  - Update NumPy build constraints for NumPy 1.25+. For Python 3.9+, it is no
+    longer necessary to set build constraints while building binary wheels.
+  - Refactor Cython profiling in order to disable profiling for Python 3.12 in
+    the package setup, since Cython does not currently support profiling for
+    Python 3.12.
+
+## Trained pipelines {id="pipelines"}
+
+### Pipeline updates {id="pipeline-updates"}
+
+The transformer-based `trf` pipelines have been updated to use our new
+[Curated Transformers](https://github.com/explosion/curated-transformers)
+library using the Thinc model wrappers and pipeline component from
+[spaCy Curated Transformers](https://github.com/explosion/spacy-curated-transformers).
+
+## Notes about upgrading from v3.6 {id="upgrading"}
+
+This release drops support for Python 3.6, drops mypy checks for Python 3.7 and
+removes the `ray` extra. In addition, there are several minor changes for spaCy
+projects described in the following section.
+
+### Backwards incompatibilities for spaCy Projects {id="upgrading-projects"}
+
+`spacy project` has a few backwards incompatibilities due to the transition to
+the standalone library [Weasel](https://github.com/explosion/weasel), which is
+not as tightly coupled to spaCy. Weasel produces warnings when it detects older
+spaCy-specific settings in your environment or project config.
+
+- Support for the `spacy_version` configuration key has been dropped.
+- Support for the `check_requirements` configuration key has been dropped due to
+  the deprecation of `pkg_resources`.
+- The `SPACY_CONFIG_OVERRIDES` environment variable is no longer checked. You
+  can set configuration overrides using `WEASEL_CONFIG_OVERRIDES`.
+- Support for the `SPACY_PROJECT_USE_GIT_VERSION` environment variable has been
+  dropped.
+- Error codes are now Weasel-specific and do not follow spaCy error codes.
+
+### Pipeline package version compatibility {id="version-compat"}
+
+> #### Using legacy implementations
+>
+> In spaCy v3, you'll still be able to load and reference legacy implementations
+> via [`spacy-legacy`](https://github.com/explosion/spacy-legacy), even if the
+> components or architectures change and newer versions are available in the
+> core library.
+
+When you're loading a pipeline package trained with an earlier version of spaCy
+v3, you will see a warning telling you that the pipeline may be incompatible.
+This doesn't necessarily have to be true, but we recommend running your
+pipelines against your test suite or evaluation data to make sure there are no
+unexpected results.
+
+If you're using one of the [trained pipelines](/models) we provide, you should
+run [`spacy download`](/api/cli#download) to update to the latest version. To
+see an overview of all installed packages and their compatibility, you can run
+[`spacy validate`](/api/cli#validate).
+
+If you've trained your own custom pipeline and you've confirmed that it's still
+working as expected, you can update the spaCy version requirements in the
+[`meta.json`](/api/data-formats#meta):
+
+```diff
+- "spacy_version": ">=3.6.0,<3.7.0",
++ "spacy_version": ">=3.6.0,<3.8.0",
+```
+
+### Updating v3.6 configs
+
+To update a config from spaCy v3.6 with the new v3.7 settings, run
+[`init fill-config`](/api/cli#init-fill-config):
+
+```cli
+$ python -m spacy init fill-config config-v3.6.cfg config-v3.7.cfg
+```
+
+In many cases ([`spacy train`](/api/cli#train),
+[`spacy.load`](/api/top-level#spacy.load)), the new defaults will be filled in
+automatically, but you'll need to fill in the new settings to run
+[`debug config`](/api/cli#debug) and [`debug data`](/api/cli#debug-data).
diff --git a/website/meta/sidebars.json b/website/meta/sidebars.json
index 617473cb0..24213ed12 100644
--- a/website/meta/sidebars.json
+++ b/website/meta/sidebars.json
@@ -15,7 +15,8 @@
                     { "text": "New in v3.3", "url": "/usage/v3-3" },
                     { "text": "New in v3.4", "url": "/usage/v3-4" },
                     { "text": "New in v3.5", "url": "/usage/v3-5" },
-                    { "text": "New in v3.6", "url": "/usage/v3-6" }
+                    { "text": "New in v3.6", "url": "/usage/v3-6" },
+                    { "text": "New in v3.7", "url": "/usage/v3-7" }
                 ]
             },
             {
diff --git a/website/src/templates/index.js b/website/src/templates/index.js
index c8295593c..1c969bd39 100644
--- a/website/src/templates/index.js
+++ b/website/src/templates/index.js
@@ -58,8 +58,8 @@ const AlertSpace = ({ nightly, legacy }) => {
 }
 
 const navAlert = (
-    <Link to="/usage/v3-6" noLinkLayout>
-        <strong>💥 Out now:</strong> spaCy v3.6
+    <Link to="/usage/v3-7" noLinkLayout>
+        <strong>💥 Out now:</strong> spaCy v3.7
     </Link>
 )
 

From 92ce32aa3f04b2d7fac2db0b5bfe3411c8709d9e Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Mon, 2 Oct 2023 12:53:46 +0200
Subject: [PATCH 04/25] Update binder version to v3.7 (#13034)

---
 website/meta/site.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/website/meta/site.json b/website/meta/site.json
index 08fcde62e..a07d131d3 100644
--- a/website/meta/site.json
+++ b/website/meta/site.json
@@ -27,7 +27,7 @@
         "indexName": "spacy"
     },
     "binderUrl": "explosion/spacy-io-binder",
-    "binderVersion": "3.6",
+    "binderVersion": "3.7",
     "sections": [
         { "id": "usage", "title": "Usage Documentation", "theme": "blue" },
         { "id": "models", "title": "Models Documentation", "theme": "blue" },

From 6d0185f7fba4d8a4f76a9c35d2e78542ee0c226a Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Wed, 4 Oct 2023 12:33:33 +0200
Subject: [PATCH 05/25] Revert "Load the cli module lazily for spacy.info
 (#12962)"

This reverts commit beda27a91eadd70563dbaffd844d8c9d5e245928.
---
 spacy/__init__.py       | 7 +------
 spacy/tests/test_cli.py | 4 ----
 2 files changed, 1 insertion(+), 10 deletions(-)

diff --git a/spacy/__init__.py b/spacy/__init__.py
index 8aa2eccd7..1a18ad0d5 100644
--- a/spacy/__init__.py
+++ b/spacy/__init__.py
@@ -13,6 +13,7 @@ from thinc.api import Config, prefer_gpu, require_cpu, require_gpu  # noqa: F401
 from . import pipeline  # noqa: F401
 from . import util
 from .about import __version__  # noqa: F401
+from .cli.info import info  # noqa: F401
 from .errors import Errors
 from .glossary import explain  # noqa: F401
 from .language import Language
@@ -76,9 +77,3 @@ def blank(
     # We should accept both dot notation and nested dict here for consistency
     config = util.dot_to_dict(config)
     return LangClass.from_config(config, vocab=vocab, meta=meta)
-
-
-def info(*args, **kwargs):
-    from .cli.info import info as cli_info
-
-    return cli_info(*args, **kwargs)
diff --git a/spacy/tests/test_cli.py b/spacy/tests/test_cli.py
index 0d2fe0a9e..86451317b 100644
--- a/spacy/tests/test_cli.py
+++ b/spacy/tests/test_cli.py
@@ -12,7 +12,6 @@ from thinc.api import Config
 
 import spacy
 from spacy import about
-from spacy import info as spacy_info
 from spacy.cli import info
 from spacy.cli._util import parse_config_overrides, string_to_list, walk_directory
 from spacy.cli.apply import apply
@@ -193,9 +192,6 @@ def test_cli_info():
         raw_data = info(tmp_dir, exclude=[""])
         assert raw_data["lang"] == "nl"
         assert raw_data["components"] == ["textcat"]
-        raw_data = spacy_info(tmp_dir, exclude=[""])
-        assert raw_data["lang"] == "nl"
-        assert raw_data["components"] == ["textcat"]
 
 
 def test_cli_converters_conllu_to_docs():

From 9d036607f1ad60ebf1719526c0ec1f531eb688e9 Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Wed, 4 Oct 2023 18:13:12 +0200
Subject: [PATCH 06/25] Set version to v3.7.1 (#13042)

---
 spacy/about.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/spacy/about.py b/spacy/about.py
index 1a3367673..0e718400b 100644
--- a/spacy/about.py
+++ b/spacy/about.py
@@ -1,5 +1,5 @@
 # fmt: off
 __title__ = "spacy"
-__version__ = "3.7.0"
+__version__ = "3.7.1"
 __download_url__ = "https://github.com/explosion/spacy-models/releases/download"
 __compatibility__ = "https://raw.githubusercontent.com/explosion/spacy-models/master/compatibility.json"

From 734826db79fc27b4632c364d04b4ddd450f1772d Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 5 Oct 2023 08:45:25 +0200
Subject: [PATCH 07/25] Update `spacy-llm` task argument docs w.r.t. task
 refactoring (#12995)

* Update task arguments w.r.t. task refactoring in 0.5.0.

* Add disclaimer w.r.t. gated models/Llama 2.

* Update website/docs/api/large-language-models.mdx

* Update website/docs/api/large-language-models.mdx
---
 website/docs/api/large-language-models.mdx | 271 ++++++++++++---------
 1 file changed, 162 insertions(+), 109 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index 43a95074a..845edaa1a 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -254,12 +254,14 @@ prompting.
 > max_n_words = null
 > ```
 
-| Argument      | Description                                                                                                                                                                                   |
-| ------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `template`    | Custom prompt template to send to LLM model. Defaults to [summarization.v1.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/summarization.v1.jinja). ~~str~~ |
-| `examples`    | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                |
-| `max_n_words` | Maximum number of words to be used in summary. Note that this should not expected to work exactly. Defaults to `None`. ~~Optional[int]~~                                                      |
-| `field`       | Name of extension attribute to store summary in (i. e. the summary will be available in `doc._.{field}`). Defaults to `summary`. ~~str~~                                                      |
+| Argument                    | Description                                                                                                                                                                                   |
+| --------------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [summarization.v1.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/summarization.v1.jinja). ~~str~~ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[SummarizationTask]]~~                                  |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `SummarizationExample`. ~~Optional[Type[FewshotExample]]~~                                                                                      |
+| `max_n_words`               | Maximum number of words to be used in summary. Note that this should not be expected to work exactly. Defaults to `None`. ~~Optional[int]~~                                                   |
+| `field`                     | Name of extension attribute to store summary in (i. e. the summary will be available in `doc._.{field}`). Defaults to `summary`. ~~str~~                                                      |
 
 The summarization task prompts the model for a concise summary of the provided
 text. It optionally allows to limit the response to a certain number of tokens -
@@ -325,16 +327,19 @@ When no examples are [specified](/usage/large-language-models#few-shot-prompts),
 the v3 implementation will use a dummy example in the prompt. Technically this
 means that the task will always perform few-shot prompting under the hood.
 
-| Argument                  | Description                                                                                                                                                                                            |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
-| `label_definitions`       | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
-| `template`                | Custom prompt template to send to LLM model. Defaults to [ner.v3.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/ner.v3.jinja). ~~str~~                              |
-| `description` (NEW)       | A description of what to recognize or not recognize as entities. ~~str~~                                                                                                                               |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~                              |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                              |
+| Argument                    | Description                                                                                                                                                                                            |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [ner.v3.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/ner.v3.jinja). ~~str~~                              |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[NERTask]]~~                                                     |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `NERExample`. ~~Optional[Type[FewshotExample]]~~                                                                                                         |
+| `scorer`                    | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                                   |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
+| `label_definitions`         | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
+| `description` (NEW)         | A description of what to recognize or not recognize as entities. ~~str~~                                                                                                                               |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~                              |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
+| `case_sensitive_matching`   | Whether to search with case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                                 |
 
 Note that the `single_match` parameter, used in v1 and v2, is not supported
 anymore, as the CoT parsing algorithm takes care of this automatically.
@@ -415,16 +420,19 @@ v1.
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                                            |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
-| `label_definitions` (NEW) | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
-| `template` (NEW)          | Custom prompt template to send to LLM model. Defaults to [ner.v2.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/ner.v2.jinja). ~~str~~                              |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~                              |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                              |
-| `single_match`            | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                                            |
+| Argument                    | Description                                                                                                                                                                                            |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `template` (NEW)            | Custom prompt template to send to LLM model. Defaults to [ner.v2.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/ner.v2.jinja). ~~str~~                              |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[NERTask]]~~                                                     |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `NERExample`. ~~Optional[Type[FewshotExample]]~~                                                                                                         |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                                   |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
+| `label_definitions` (NEW)   | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~                              |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
+| `case_sensitive_matching`   | Whether to search with case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                                 |
+| `single_match`              | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                                            |
 
 The parameters `alignment_mode`, `case_sensitive_matching` and `single_match`
 are identical to the [v1](#ner-v1) implementation. The format of few-shot
@@ -467,14 +475,17 @@ few-shot prompting.
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                    |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | Comma-separated list of labels. ~~str~~                                                                                                                                        |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                 |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                          |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~ |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                      |
-| `single_match`            | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                    |
+| Argument                    | Description                                                                                                                                                                    |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                 |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[NERTask]]~~                             |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `NERExample`. ~~Optional[Type[FewshotExample]]~~                                                                                 |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                           |
+| `labels`                    | Comma-separated list of labels. ~~str~~                                                                                                                                        |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                          |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~ |
+| `case_sensitive_matching`   | Whether to search with case sensitivity. Defaults to `False`. ~~bool~~                                                                                                         |
+| `single_match`              | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                    |
 
 The NER task implementation doesn't currently ask the LLM for specific offsets,
 but simply expects a list of strings that represent the enties in the document.
@@ -539,17 +550,20 @@ support overlapping entities and store its annotations in `doc.spans`.
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                                            |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
-| `label_definitions`       | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
-| `template`                | Custom prompt template to send to LLM model. Defaults to [`spancat.v3.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/spancat.v3.jinja). ~~str~~                    |
-| `description` (NEW)       | A description of what to recognize or not recognize as entities. ~~str~~                                                                                                                               |
-| `spans_key`               | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                                                       |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                                                  |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                              |
+| Argument                    | Description                                                                                                                                                                                            |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [`spancat.v3.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/spancat.v3.jinja). ~~str~~                    |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[SpanCatTask]]~~                                                 |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `SpanCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                                                     |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                                   |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
+| `label_definitions`         | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
+| `description` (NEW)         | A description of what to recognize or not recognize as entities. ~~str~~                                                                                                                               |
+| `spans_key`                 | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                                                       |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                                                  |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
+| `case_sensitive_matching`   | Whether to search with case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                                 |
 
 Note that the `single_match` parameter, used in v1 and v2, is not supported
 anymore, as the CoT parsing algorithm takes care of this automatically.
@@ -568,17 +582,20 @@ support overlapping entities and store its annotations in `doc.spans`.
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                                            |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
-| `label_definitions` (NEW) | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
-| `template` (NEW)          | Custom prompt template to send to LLM model. Defaults to [`spancat.v2.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/spancat.v2.jinja). ~~str~~                    |
-| `spans_key`               | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                                                       |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                                                  |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                              |
-| `single_match`            | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                                            |
+| Argument                    | Description                                                                                                                                                                                            |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `template` (NEW)            | Custom prompt template to send to LLM model. Defaults to [`spancat.v2.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/spancat.v2.jinja). ~~str~~                    |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                                         |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[SpanCatTask]]~~                                                 |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `SpanCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                                                     |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                                   |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                                     |
+| `label_definitions` (NEW)   | Optional dict mapping a label to a description of that label. These descriptions are added to the prompt to help instruct the LLM on what to extract. Defaults to `None`. ~~Optional[Dict[str, str]]~~ |
+| `spans_key`                 | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                                                       |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                                                  |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~                         |
+| `case_sensitive_matching`   | Whether to search with case sensitivity. Defaults to `False`. ~~bool~~                                                                                                                                 |
+| `single_match`              | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                                            |
 
 Except for the `spans_key` parameter, the SpanCat v2 task reuses the
 configuration from the NER v2 task. Refer to [its documentation](#ner-v2) for
@@ -599,15 +616,18 @@ v1 NER task to support overlapping entities and store its annotations in
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                    |
-| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `labels`                  | Comma-separated list of labels. ~~str~~                                                                                                                                        |
-| `spans_key`               | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                               |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                 |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                          |
-| `alignment_mode`          | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~ |
-| `case_sensitive_matching` | Whether to search without case sensitivity. Defaults to `False`. ~~bool~~                                                                                                      |
-| `single_match`            | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                    |
+| Argument                    | Description                                                                                                                                                                    |
+| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                 |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[SpanCatTask]]~~                         |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `SpanCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                             |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                           |
+| `labels`                    | Comma-separated list of labels. ~~str~~                                                                                                                                        |
+| `spans_key`                 | Key of the `Doc.spans` dict to save the spans under. Defaults to `"sc"`. ~~str~~                                                                                               |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, defaults to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                          |
+| `alignment_mode`            | Alignment mode in case the LLM returns entities that do not align with token boundaries. Options are `"strict"`, `"contract"` or `"expand"`. Defaults to `"contract"`. ~~str~~ |
+| `case_sensitive_matching`   | Whether to perform case-sensitive matching. Defaults to `False`. ~~bool~~                                                                                                      |
+| `single_match`              | Whether to match an entity in the LLM's response only once (the first hit) or multiple times. Defaults to `False`. ~~bool~~                                                    |
 
 Except for the `spans_key` parameter, the SpanCat v1 task reuses the
 configuration from the NER v1 task. Refer to [its documentation](#ner-v1) for
@@ -636,16 +656,19 @@ prompt.
 > examples = null
 > ```
 
-| Argument                  | Description                                                                                                                                                                         |
-| ------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `labels`                  | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                  |
-| `label_definitions` (NEW) | Dictionary of label definitions. Included in the prompt, if set. Defaults to `None`. ~~Optional[Dict[str, str]]~~                                                                   |
-| `template`                | Custom prompt template to send to LLM model. Defaults to [`textcat.v3.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/textcat.v3.jinja). ~~str~~ |
-| `examples`                | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                      |
-| `normalizer`              | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~         |
-| `exclusive_classes`       | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Defaults to `False`. ~~bool~~                              |
-| `allow_none`              | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Defaults to `True`. ~~bool~~       |
-| `verbose`                 | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                                  |
+| Argument                    | Description                                                                                                                                                                         |
+| --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [`textcat.v3.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/textcat.v3.jinja). ~~str~~ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                      |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[TextCatTask]]~~                              |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `TextCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                                  |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                  |
+| `label_definitions` (NEW)   | Dictionary of label definitions. Included in the prompt, if set. Defaults to `None`. ~~Optional[Dict[str, str]]~~                                                                   |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~         |
+| `exclusive_classes`         | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Defaults to `False`. ~~bool~~                              |
+| `allow_none`                | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Defaults to `True`. ~~bool~~       |
+| `verbose`                   | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                                  |
 
 The formatting of few-shot examples is the same as those for the
 [v1](#textcat-v1) implementation.
@@ -663,15 +686,18 @@ V2 includes all v1 functionality, with an improved prompt template.
 > examples = null
 > ```
 
-| Argument            | Description                                                                                                                                                                         |
-| ------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `labels`            | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                  |
-| `template` (NEW)    | Custom prompt template to send to LLM model. Defaults to [`textcat.v2.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/textcat.v2.jinja). ~~str~~ |
-| `examples`          | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                      |
-| `normalizer`        | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                             |
-| `exclusive_classes` | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Defaults to `False`. ~~bool~~                              |
-| `allow_none`        | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Defaults to `True`. ~~bool~~       |
-| `verbose`           | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                                  |
+| Argument                    | Description                                                                                                                                                                         |
+| --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template` (NEW)            | Custom prompt template to send to LLM model. Defaults to [`textcat.v2.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/textcat.v2.jinja). ~~str~~ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                      |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[TextCatTask]]~~                              |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `TextCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                                  |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                                |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                                  |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                             |
+| `exclusive_classes`         | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Defaults to `False`. ~~bool~~                              |
+| `allow_none`                | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Defaults to `True`. ~~bool~~       |
+| `verbose`                   | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                                  |
 
 The formatting of few-shot examples is the same as those for the
 [v1](#textcat-v1) implementation.
@@ -690,14 +716,17 @@ prompting.
 > examples = null
 > ```
 
-| Argument            | Description                                                                                                                                                                   |
-| ------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `labels`            | Comma-separated list of labels. ~~str~~                                                                                                                                       |
-| `examples`          | Optional function that generates examples for few-shot learning. Deafults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                |
-| `normalizer`        | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                       |
-| `exclusive_classes` | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Deafults to `False`. ~~bool~~                        |
-| `allow_none`        | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Deafults to `True`. ~~bool~~ |
-| `verbose`           | If set to `True`, warnings will be generated when the LLM returns invalid responses. Deafults to `False`. ~~bool~~                                                            |
+| Argument                    | Description                                                                                                                                                                   |
+| --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[TextCatTask]]~~                        |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `TextCatExample`. ~~Optional[Type[FewshotExample]]~~                                                                            |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                          |
+| `labels`                    | Comma-separated list of labels. ~~str~~                                                                                                                                       |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. ~~Optional[Callable[[str], str]]~~                       |
+| `exclusive_classes`         | If set to `True`, only one label per document should be valid. If set to `False`, one document can have multiple labels. Defaults to `False`. ~~bool~~                        |
+| `allow_none`                | When set to `True`, allows the LLM to not return any of the given label. The resulting dict in `doc.cats` will have `0.0` scores for all labels. Defaults to `True`. ~~bool~~ |
+| `verbose`                   | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                            |
 
 To perform [few-shot learning](/usage/large-language-models#few-shot-prompts),
 you can write down a few examples in a separate file, and provide these to be
@@ -740,14 +769,17 @@ on an upstream NER component for entities extraction.
 > labels = ["LivesIn", "Visits"]
 > ```
 
-| Argument            | Description                                                                                                                                                                 |
-| ------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `labels`            | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                          |
-| `template`          | Custom prompt template to send to LLM model. Defaults to [`rel.v3.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/rel.v1.jinja). ~~str~~ |
-| `label_definitions` | Dictionary providing a description for each relation label. Defaults to `None`. ~~Optional[Dict[str, str]]~~                                                                |
-| `examples`          | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                              |
-| `normalizer`        | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~ |
-| `verbose`           | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                          |
+| Argument                    | Description                                                                                                                                                                 |
+| --------------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [`rel.v1.jinja`](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/rel.v1.jinja). ~~str~~ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                              |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[RELTask]]~~                          |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `RELExample`. ~~Optional[Type[FewshotExample]]~~                                                                              |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                        |
+| `labels`                    | List of labels or str of comma-separated list of labels. ~~Union[List[str], str]~~                                                                                          |
+| `label_definitions`         | Dictionary providing a description for each relation label. Defaults to `None`. ~~Optional[Dict[str, str]]~~                                                                |
+| `normalizer`                | Function that normalizes the labels as returned by the LLM. If `None`, falls back to `spacy.LowercaseNormalizer.v1`. Defaults to `None`. ~~Optional[Callable[[str], str]]~~ |
+| `verbose`                   | If set to `True`, warnings will be generated when the LLM returns invalid responses. Defaults to `False`. ~~bool~~                                                          |
 
 To perform [few-shot learning](/usage/large-language-models#few-shot-prompts),
 you can write down a few examples in a separate file, and provide these to be
@@ -793,10 +825,13 @@ This task supports both zero-shot and few-shot prompting.
 > examples = null
 > ```
 
-| Argument   | Description                                                                                                                                                                   |
-| ---------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `template` | Custom prompt template to send to LLM model. Defaults to [lemma.v1.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/lemma.v1.jinja). ~~str~~ |
-| `examples` | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                |
+| Argument                    | Description                                                                                                                                                                   |
+| --------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [lemma.v1.jinja](https://github.com/explosion/spacy-llm/blob/main/spacy_llm/tasks/templates/lemma.v1.jinja). ~~str~~ |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                                                |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[LemmaTask]]~~                          |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `LemmaExample`. ~~Optional[Type[FewshotExample]]~~                                                                              |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                                          |
 
 The task prompts the LLM to lemmatize the passed text and return the lemmatized
 version as a list of tokens and their corresponding lemma. E. g. the text
@@ -870,11 +905,14 @@ This task supports both zero-shot and few-shot prompting.
 > examples = null
 > ```
 
-| Argument   | Description                                                                                                                                |
-| ---------- | ------------------------------------------------------------------------------------------------------------------------------------------ |
-| `template` | Custom prompt template to send to LLM model. Defaults to [sentiment.v1.jinja](./spacy_llm/tasks/templates/sentiment.v1.jinja). ~~str~~     |
-| `examples` | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~             |
-| `field`    | Name of extension attribute to store summary in (i. e. the summary will be available in `doc._.{field}`). Defaults to `sentiment`. ~~str~~ |
+| Argument                    | Description                                                                                                                                              |
+| --------------------------- | -------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `template`                  | Custom prompt template to send to LLM model. Defaults to [sentiment.v1.jinja](./spacy_llm/tasks/templates/sentiment.v1.jinja). ~~str~~                   |
+| `examples`                  | Optional function that generates examples for few-shot learning. Defaults to `None`. ~~Optional[Callable[[], Iterable[Any]]]~~                           |
+| `parse_responses` (NEW)     | Callable for parsing LLM responses for this task. Defaults to the internal parsing method for this task. ~~Optional[TaskResponseParser[SentimentTask]]~~ |
+| `prompt_example_type` (NEW) | Type to use for fewshot examples. Defaults to `SentimentExample`. ~~Optional[Type[FewshotExample]]~~                                                     |
+| `scorer` (NEW)              | Scorer function that evaluates the task performance on provided examples. Defaults to the metric used by spaCy. ~~Optional[Scorer]~~                     |
+| `field`                     | Name of extension attribute to store sentiment in (i. e. the score will be available in `doc._.{field}`). Defaults to `sentiment`. ~~str~~               |
 
 To perform [few-shot learning](/usage/large-language-models#few-shot-prompts),
 you can write down a few examples in a separate file, and provide these to be
@@ -1042,6 +1080,21 @@ Currently, these models are provided as part of the core library:
 | `spacy.StableLM.v1`  | Stability AI    | `["stablelm-base-alpha-3b", "stablelm-base-alpha-7b", "stablelm-tuned-alpha-3b", "stablelm-tuned-alpha-7b"]` | https://huggingface.co/stabilityai     |
 | `spacy.OpenLLaMA.v1` | OpenLM Research | `["open_llama_3b", "open_llama_7b", "open_llama_7b_v2", "open_llama_13b"]`                                   | https://huggingface.co/openlm-research |
 
+<Infobox variant="warning" title="Gated models on Hugging Face" id="hf_licensing">
+
+Some models available on Hugging Face (HF), such as Llama 2, are _gated models_.
+That means that users have to fulfill certain requirements to be allowed access
+to these models. In the case of Llama 2 you'll need to agree to Meta's
+Terms of Service while logged in with your HF account. After Meta grants you
+permission to use Llama 2, you'll be able to download and use the model.
+
+This requires that you are logged in with your HF account on your local
+machine - check out the HF quick start documentation. In a nutshell, you'll need
+to create an access token on HF and log in to HF using your access token, e. g.
+with `huggingface-cli login`.
+
+</Infobox>
+
 Note that Hugging Face will download the model the first time you use it - you
 can
 [define the cached directory](https://huggingface.co/docs/huggingface_hub/main/en/guides/manage-cache)

From 6e54360a3d068c2b85b45902f8885b8db043372f Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Thu, 5 Oct 2023 08:50:22 +0200
Subject: [PATCH 08/25] Remove pathy dependency, update docs for cloudpathlib
 in Weasel (#13035)

---
 requirements.txt                | 1 -
 setup.cfg                       | 1 -
 spacy/cli/_util.py              | 4 ----
 website/docs/api/cli.mdx        | 6 +++---
 website/docs/usage/projects.mdx | 6 +++---
 5 files changed, 6 insertions(+), 12 deletions(-)

diff --git a/requirements.txt b/requirements.txt
index a8ba956a1..3050624f9 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -10,7 +10,6 @@ wasabi>=0.9.1,<1.2.0
 srsly>=2.4.3,<3.0.0
 catalogue>=2.0.6,<2.1.0
 typer>=0.3.0,<0.10.0
-pathy>=0.10.0
 smart-open>=5.2.1,<7.0.0
 weasel>=0.1.0,<0.4.0
 # Third party dependencies
diff --git a/setup.cfg b/setup.cfg
index 75f2e3a15..ab9e39e0c 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -56,7 +56,6 @@ install_requires =
     weasel>=0.1.0,<0.4.0
     # Third-party dependencies
     typer>=0.3.0,<0.10.0
-    pathy>=0.10.0
     smart-open>=5.2.1,<7.0.0
     tqdm>=4.38.0,<5.0.0
     numpy>=1.15.0; python_version < "3.9"
diff --git a/spacy/cli/_util.py b/spacy/cli/_util.py
index bc6c53cd9..fa41e6a08 100644
--- a/spacy/cli/_util.py
+++ b/spacy/cli/_util.py
@@ -41,10 +41,6 @@ from ..util import (
     run_command,
 )
 
-if TYPE_CHECKING:
-    from pathy import FluidPath  # noqa: F401
-
-
 SDIST_SUFFIX = ".tar.gz"
 WHEEL_SUFFIX = "-py3-none-any.whl"
 
diff --git a/website/docs/api/cli.mdx b/website/docs/api/cli.mdx
index 3ec0081c9..51cae960b 100644
--- a/website/docs/api/cli.mdx
+++ b/website/docs/api/cli.mdx
@@ -1544,9 +1544,9 @@ obsolete files is left up to you.
 
 Remotes can be defined in the `remotes` section of the
 [`project.yml`](/usage/projects#project-yml). Under the hood, spaCy uses
-[`Pathy`](https://github.com/justindujardin/pathy) to communicate with the
-remote storages, so you can use any protocol that `Pathy` supports, including
-[S3](https://aws.amazon.com/s3/),
+[`cloudpathlib`](https://cloudpathlib.drivendata.org) to communicate with the
+remote storages, so you can use any protocol that `cloudpathlib` supports,
+including [S3](https://aws.amazon.com/s3/),
 [Google Cloud Storage](https://cloud.google.com/storage), and the local
 filesystem, although you may need to install extra dependencies to use certain
 protocols.
diff --git a/website/docs/usage/projects.mdx b/website/docs/usage/projects.mdx
index f3cca8013..b089a7ab5 100644
--- a/website/docs/usage/projects.mdx
+++ b/website/docs/usage/projects.mdx
@@ -656,9 +656,9 @@ locally.
 You can list one or more remotes in the `remotes` section of your
 [`project.yml`](#project-yml) by mapping a string name to the URL of the
 storage. Under the hood, spaCy uses
-[`Pathy`](https://github.com/justindujardin/pathy) to communicate with the
-remote storages, so you can use any protocol that `Pathy` supports, including
-[S3](https://aws.amazon.com/s3/),
+[`cloudpathlib`](https://cloudpathlib.drivendata.org) to communicate with the
+remote storages, so you can use any protocol that `cloudpathlib` supports,
+including [S3](https://aws.amazon.com/s3/),
 [Google Cloud Storage](https://cloud.google.com/storage), and the local
 filesystem, although you may need to install extra dependencies to use certain
 protocols.

From 1dec138e61f41963096772cd096e1a1e07ae2ce9 Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 5 Oct 2023 08:50:41 +0200
Subject: [PATCH 09/25] Update docs w.r.t. PaLM support. (#13018)

---
 website/docs/api/large-language-models.mdx   | 7 +++++++
 website/docs/usage/large-language-models.mdx | 5 +++--
 2 files changed, 10 insertions(+), 2 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index 845edaa1a..aac4c5108 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -1022,6 +1022,7 @@ Currently, these models are provided as part of the core library:
 | `spacy.Claude-1-3.v1`         | Anthropic | `["claude-1.3", "claude-1.3-100k"]`                                                                                | `"claude-1.3"`         | `{}`                                 |
 | `spacy.Claude-instant-1.v1`   | Anthropic | `["claude-instant-1", "claude-instant-1-100k"]`                                                                    | `"claude-instant-1"`   | `{}`                                 |
 | `spacy.Claude-instant-1-1.v1` | Anthropic | `["claude-instant-1.1", "claude-instant-1.1-100k"]`                                                                | `"claude-instant-1.1"` | `{}`                                 |
+| `spacy.PaLM.v1`               | Google    | `["chat-bison-001", "text-bison-001"]`                                                                             | `"text-bison-001"`     | `{temperature=0.0}`                  |
 
 To use these models, make sure that you've [set the relevant API](#api-keys)
 keys as environment variables.
@@ -1052,6 +1053,12 @@ For Anthropic:
 export ANTHROPIC_API_KEY="..."
 ```
 
+For PaLM:
+
+```shell
+export PALM_API_KEY="..."
+```
+
 ### Models via HuggingFace {id="models-hf"}
 
 These models all take the same parameters:
diff --git a/website/docs/usage/large-language-models.mdx b/website/docs/usage/large-language-models.mdx
index 86f44f5ae..35117ef57 100644
--- a/website/docs/usage/large-language-models.mdx
+++ b/website/docs/usage/large-language-models.mdx
@@ -170,8 +170,8 @@ to be `"databricks/dolly-v2-12b"` for better performance.
 ### Example 3: Create the component directly in Python {id="example-3"}
 
 The `llm` component behaves as any other component does, and there are
-[task-specific components](/api/large-language-models#config) defined to
-help you hit the ground running with a reasonable built-in task implementation.
+[task-specific components](/api/large-language-models#config) defined to help
+you hit the ground running with a reasonable built-in task implementation.
 
 ```python
 import spacy
@@ -484,6 +484,7 @@ provider's documentation.
 | [`spacy.Claude-1-0.v1`](/api/large-language-models#models-rest)         | Anthropic’s `claude-1.0` model family.         |
 | [`spacy.Claude-1-2.v1`](/api/large-language-models#models-rest)         | Anthropic’s `claude-1.2` model family.         |
 | [`spacy.Claude-1-3.v1`](/api/large-language-models#models-rest)         | Anthropic’s `claude-1.3` model family.         |
+| [`spacy.PaLM.v1`](/api/large-language-models#models-rest)               | Google’s `PaLM` model family.                  |
 | [`spacy.Dolly.v1`](/api/large-language-models#models-hf)                | Dolly models through HuggingFace.              |
 | [`spacy.Falcon.v1`](/api/large-language-models#models-hf)               | Falcon models through HuggingFace.             |
 | [`spacy.Llama2.v1`](/api/large-language-models#models-hf)               | Llama2 models through HuggingFace.             |

From 862f8254e8498fc426a406f56d44b350d830e852 Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 5 Oct 2023 13:18:27 +0200
Subject: [PATCH 10/25] Add docs on Azure OpenAI support in `spacy-llm`
 (#13043)

* Add gpt-3.5-turbo-instruct to list of supported OpenAI models.

* Update `spacy-llm` task argument docs w.r.t. task refactoring (#12995)

* Update task arguments w.r.t. task refactoring in 0.5.0.

* Add disclaimer w.r.t. gated models/Llama 2.

* Update website/docs/api/large-language-models.mdx

* Update website/docs/api/large-language-models.mdx

* Update docs w.r.t. PaLM support. (#13018)

* Add info on spacy.Azure.v1.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Attempt to fix netlify check fails.

* Format.
---
 website/docs/api/large-language-models.mdx   | 85 ++++++++++++--------
 website/docs/usage/large-language-models.mdx |  1 +
 2 files changed, 53 insertions(+), 33 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index aac4c5108..c5d106e29 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -990,43 +990,62 @@ provider's API.
 
 Currently, these models are provided as part of the core library:
 
-| Model                         | Provider  | Supported names                                                                                                    | Default name           | Default config                       |
-| ----------------------------- | --------- | ------------------------------------------------------------------------------------------------------------------ | ---------------------- | ------------------------------------ |
-| `spacy.GPT-4.v1`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{}`                                 |
-| `spacy.GPT-4.v2`              | OpenAI    | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{temperature=0.0}`                  |
-| `spacy.GPT-3-5.v1`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{}`                                 |
-| `spacy.GPT-3-5.v2`            | OpenAI    | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{temperature=0.0}`                  |
-| `spacy.Davinci.v1`            | OpenAI    | `["davinci"]`                                                                                                      | `"davinci"`            | `{}`                                 |
-| `spacy.Davinci.v2`            | OpenAI    | `["davinci"]`                                                                                                      | `"davinci"`            | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Davinci.v1`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{}`                                 |
-| `spacy.Text-Davinci.v2`       | OpenAI    | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{temperature=0.0, max_tokens=1000}` |
-| `spacy.Code-Davinci.v1`       | OpenAI    | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{}`                                 |
-| `spacy.Code-Davinci.v2`       | OpenAI    | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Curie.v1`              | OpenAI    | `["curie"]`                                                                                                        | `"curie"`              | `{}`                                 |
-| `spacy.Curie.v2`              | OpenAI    | `["curie"]`                                                                                                        | `"curie"`              | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Curie.v1`         | OpenAI    | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{}`                                 |
-| `spacy.Text-Curie.v2`         | OpenAI    | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Babbage.v1`            | OpenAI    | `["babbage"]`                                                                                                      | `"babbage"`            | `{}`                                 |
-| `spacy.Babbage.v2`            | OpenAI    | `["babbage"]`                                                                                                      | `"babbage"`            | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Babbage.v1`       | OpenAI    | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{}`                                 |
-| `spacy.Text-Babbage.v2`       | OpenAI    | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Ada.v1`                | OpenAI    | `["ada"]`                                                                                                          | `"ada"`                | `{}`                                 |
-| `spacy.Ada.v2`                | OpenAI    | `["ada"]`                                                                                                          | `"ada"`                | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Text-Ada.v1`           | OpenAI    | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{}`                                 |
-| `spacy.Text-Ada.v2`           | OpenAI    | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{temperature=0.0, max_tokens=500}`  |
-| `spacy.Command.v1`            | Cohere    | `["command", "command-light", "command-light-nightly", "command-nightly"]`                                         | `"command"`            | `{}`                                 |
-| `spacy.Claude-2.v1`           | Anthropic | `["claude-2", "claude-2-100k"]`                                                                                    | `"claude-2"`           | `{}`                                 |
-| `spacy.Claude-1.v1`           | Anthropic | `["claude-1", "claude-1-100k"]`                                                                                    | `"claude-1"`           | `{}`                                 |
-| `spacy.Claude-1-0.v1`         | Anthropic | `["claude-1.0"]`                                                                                                   | `"claude-1.0"`         | `{}`                                 |
-| `spacy.Claude-1-2.v1`         | Anthropic | `["claude-1.2"]`                                                                                                   | `"claude-1.2"`         | `{}`                                 |
-| `spacy.Claude-1-3.v1`         | Anthropic | `["claude-1.3", "claude-1.3-100k"]`                                                                                | `"claude-1.3"`         | `{}`                                 |
-| `spacy.Claude-instant-1.v1`   | Anthropic | `["claude-instant-1", "claude-instant-1-100k"]`                                                                    | `"claude-instant-1"`   | `{}`                                 |
-| `spacy.Claude-instant-1-1.v1` | Anthropic | `["claude-instant-1.1", "claude-instant-1.1-100k"]`                                                                | `"claude-instant-1.1"` | `{}`                                 |
-| `spacy.PaLM.v1`               | Google    | `["chat-bison-001", "text-bison-001"]`                                                                             | `"text-bison-001"`     | `{temperature=0.0}`                  |
+| Model                         | Provider          | Supported names                                                                                                    | Default name           | Default config                       |
+| ----------------------------- | ----------------- | ------------------------------------------------------------------------------------------------------------------ | ---------------------- | ------------------------------------ |
+| `spacy.GPT-4.v1`              | OpenAI            | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{}`                                 |
+| `spacy.GPT-4.v2`              | OpenAI            | `["gpt-4", "gpt-4-0314", "gpt-4-32k", "gpt-4-32k-0314"]`                                                           | `"gpt-4"`              | `{temperature=0.0}`                  |
+| `spacy.GPT-3-5.v1`            | OpenAI            | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{}`                                 |
+| `spacy.GPT-3-5.v2`            | OpenAI            | `["gpt-3.5-turbo", "gpt-3.5-turbo-16k", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-0613-16k", "gpt-3.5-turbo-instruct"]` | `"gpt-3.5-turbo"`      | `{temperature=0.0}`                  |
+| `spacy.Davinci.v1`            | OpenAI            | `["davinci"]`                                                                                                      | `"davinci"`            | `{}`                                 |
+| `spacy.Davinci.v2`            | OpenAI            | `["davinci"]`                                                                                                      | `"davinci"`            | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Davinci.v1`       | OpenAI            | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{}`                                 |
+| `spacy.Text-Davinci.v2`       | OpenAI            | `["text-davinci-003", "text-davinci-002"]`                                                                         | `"text-davinci-003"`   | `{temperature=0.0, max_tokens=1000}` |
+| `spacy.Code-Davinci.v1`       | OpenAI            | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{}`                                 |
+| `spacy.Code-Davinci.v2`       | OpenAI            | `["code-davinci-002"]`                                                                                             | `"code-davinci-002"`   | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Curie.v1`              | OpenAI            | `["curie"]`                                                                                                        | `"curie"`              | `{}`                                 |
+| `spacy.Curie.v2`              | OpenAI            | `["curie"]`                                                                                                        | `"curie"`              | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Curie.v1`         | OpenAI            | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{}`                                 |
+| `spacy.Text-Curie.v2`         | OpenAI            | `["text-curie-001"]`                                                                                               | `"text-curie-001"`     | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Babbage.v1`            | OpenAI            | `["babbage"]`                                                                                                      | `"babbage"`            | `{}`                                 |
+| `spacy.Babbage.v2`            | OpenAI            | `["babbage"]`                                                                                                      | `"babbage"`            | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Babbage.v1`       | OpenAI            | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{}`                                 |
+| `spacy.Text-Babbage.v2`       | OpenAI            | `["text-babbage-001"]`                                                                                             | `"text-babbage-001"`   | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Ada.v1`                | OpenAI            | `["ada"]`                                                                                                          | `"ada"`                | `{}`                                 |
+| `spacy.Ada.v2`                | OpenAI            | `["ada"]`                                                                                                          | `"ada"`                | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Text-Ada.v1`           | OpenAI            | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{}`                                 |
+| `spacy.Text-Ada.v2`           | OpenAI            | `["text-ada-001"]`                                                                                                 | `"text-ada-001"`       | `{temperature=0.0, max_tokens=500}`  |
+| `spacy.Azure.v1`              | Microsoft, OpenAI | Arbitrary values                                                                                                   | No default             | `{temperature=0.0}`                  |
+| `spacy.Command.v1`            | Cohere            | `["command", "command-light", "command-light-nightly", "command-nightly"]`                                         | `"command"`            | `{}`                                 |
+| `spacy.Claude-2.v1`           | Anthropic         | `["claude-2", "claude-2-100k"]`                                                                                    | `"claude-2"`           | `{}`                                 |
+| `spacy.Claude-1.v1`           | Anthropic         | `["claude-1", "claude-1-100k"]`                                                                                    | `"claude-1"`           | `{}`                                 |
+| `spacy.Claude-1-0.v1`         | Anthropic         | `["claude-1.0"]`                                                                                                   | `"claude-1.0"`         | `{}`                                 |
+| `spacy.Claude-1-2.v1`         | Anthropic         | `["claude-1.2"]`                                                                                                   | `"claude-1.2"`         | `{}`                                 |
+| `spacy.Claude-1-3.v1`         | Anthropic         | `["claude-1.3", "claude-1.3-100k"]`                                                                                | `"claude-1.3"`         | `{}`                                 |
+| `spacy.Claude-instant-1.v1`   | Anthropic         | `["claude-instant-1", "claude-instant-1-100k"]`                                                                    | `"claude-instant-1"`   | `{}`                                 |
+| `spacy.Claude-instant-1-1.v1` | Anthropic         | `["claude-instant-1.1", "claude-instant-1.1-100k"]`                                                                | `"claude-instant-1.1"` | `{}`                                 |
+| `spacy.PaLM.v1`               | Google            | `["chat-bison-001", "text-bison-001"]`                                                                             | `"text-bison-001"`     | `{temperature=0.0}`                  |
 
 To use these models, make sure that you've [set the relevant API](#api-keys)
 keys as environment variables.
 
+**⚠️ A note on `spacy.Azure.v1`.** Working with Azure OpenAI is slightly
+different than working with models from other providers:
+
+- In Azure, LLMs have to be made available by creating a _deployment_ of a given
+  model (e.g. GPT-3.5). This deployment can have an arbitrary name. The `name`
+  argument, which everywhere else denotes the model name (e.g. `claude-1.0`,
+  `gpt-3.5`), here refers to the _deployment name_.
+- Deployed Azure OpenAI models are reachable via a resource-specific base URL,
+  usually of the form `https://{resource}.openai.azure.com`. Hence the URL has
+  to be specified via the `base_url` argument.
+- Azure further expects the _API version_ to be specified. The default value for
+  this, via the `api_version` argument, is currently `2023-05-15` but may be
+  updated in the future.
+- Finally, since we can't infer information about the model from the deployment
+  name, `spacy-llm` requires the `model_type` to be set to either
+  `"completions"` or `"chat"`, depending on whether the deployed model is a
+  completion or chat model.
+
 #### API Keys {id="api-keys"}
 
 Note that when using hosted services, you have to ensure that the proper API
diff --git a/website/docs/usage/large-language-models.mdx b/website/docs/usage/large-language-models.mdx
index 35117ef57..875ff33d4 100644
--- a/website/docs/usage/large-language-models.mdx
+++ b/website/docs/usage/large-language-models.mdx
@@ -476,6 +476,7 @@ provider's documentation.
 | [`spacy.Curie.v2`](/api/large-language-models#models-rest)              | OpenAI’s `curie` model family.                 |
 | [`spacy.Babbage.v2`](/api/large-language-models#models-rest)            | OpenAI’s `babbage` model family.               |
 | [`spacy.Ada.v2`](/api/large-language-models#models-rest)                | OpenAI’s `ada` model family.                   |
+| [`spacy.Azure.v1`](/api/large-language-models#models-rest)              | Azure’s OpenAI models.                         |
 | [`spacy.Command.v1`](/api/large-language-models#models-rest)            | Cohere’s `command` model family.               |
 | [`spacy.Claude-2.v1`](/api/large-language-models#models-rest)           | Anthropic’s `claude-2` model family.           |
 | [`spacy.Claude-1.v1`](/api/large-language-models#models-rest)           | Anthropic’s `claude-1` model family.           |

From 1162fcf0994dd7f83a744eddd0bdd31bccd5ca29 Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 5 Oct 2023 14:44:38 +0200
Subject: [PATCH 11/25] Add Mistral mentions. (#13037)

---
 website/docs/api/large-language-models.mdx   | 3 ++-
 website/docs/usage/large-language-models.mdx | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index c5d106e29..f8404cb2e 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -1101,8 +1101,9 @@ Currently, these models are provided as part of the core library:
 | Model                | Provider        | Supported names                                                                                              | HF directory                           |
 | -------------------- | --------------- | ------------------------------------------------------------------------------------------------------------ | -------------------------------------- |
 | `spacy.Dolly.v1`     | Databricks      | `["dolly-v2-3b", "dolly-v2-7b", "dolly-v2-12b"]`                                                             | https://huggingface.co/databricks      |
-| `spacy.Llama2.v1`    | Meta AI         | `["Llama-2-7b-hf", "Llama-2-13b-hf", "Llama-2-70b-hf"]`                                                      | https://huggingface.co/meta-llama      |
 | `spacy.Falcon.v1`    | TII             | `["falcon-rw-1b", "falcon-7b", "falcon-7b-instruct", "falcon-40b-instruct"]`                                 | https://huggingface.co/tiiuae          |
+| `spacy.Llama2.v1`    | Meta AI         | `["Llama-2-7b-hf", "Llama-2-13b-hf", "Llama-2-70b-hf"]`                                                      | https://huggingface.co/meta-llama      |
+| `spacy.Mistral.v1`   | Mistral AI      | `["Mistral-7B-v0.1", "Mistral-7B-Instruct-v0.1"]`                                                            | https://huggingface.co/mistralai       |
 | `spacy.StableLM.v1`  | Stability AI    | `["stablelm-base-alpha-3b", "stablelm-base-alpha-7b", "stablelm-tuned-alpha-3b", "stablelm-tuned-alpha-7b"]` | https://huggingface.co/stabilityai     |
 | `spacy.OpenLLaMA.v1` | OpenLM Research | `["open_llama_3b", "open_llama_7b", "open_llama_7b_v2", "open_llama_13b"]`                                   | https://huggingface.co/openlm-research |
 
diff --git a/website/docs/usage/large-language-models.mdx b/website/docs/usage/large-language-models.mdx
index 875ff33d4..94494b4e1 100644
--- a/website/docs/usage/large-language-models.mdx
+++ b/website/docs/usage/large-language-models.mdx
@@ -436,7 +436,7 @@ respectively. Alternatively you can use LangChain to access hosted or local
 models by specifying one of the models registered with the `langchain.` prefix.
 
 <Infobox>
-_Why LangChain if there are also are a native REST and a HuggingFace interface? When should I use what?_
+_Why LangChain if there are also native REST and HuggingFace interfaces? When should I use what?_
 
 Third-party libraries like `langchain` focus on prompt management, integration
 of many different LLM APIs, and other related features such as conversational
@@ -488,6 +488,7 @@ provider's documentation.
 | [`spacy.PaLM.v1`](/api/large-language-models#models-rest)               | Google’s `PaLM` model family.                  |
 | [`spacy.Dolly.v1`](/api/large-language-models#models-hf)                | Dolly models through HuggingFace.              |
 | [`spacy.Falcon.v1`](/api/large-language-models#models-hf)               | Falcon models through HuggingFace.             |
+| [`spacy.Mistral.v1`](/api/large-language-models#models-hf)              | Mistral models through HuggingFace.            |
 | [`spacy.Llama2.v1`](/api/large-language-models#models-hf)               | Llama2 models through HuggingFace.             |
 | [`spacy.StableLM.v1`](/api/large-language-models#models-hf)             | StableLM models through HuggingFace.           |
 | [`spacy.OpenLLaMA.v1`](/api/large-language-models#models-hf)            | OpenLLaMA models through HuggingFace.          |

From b83f1e372490acd86c6ddcb7b9f5b10b2d50b4ab Mon Sep 17 00:00:00 2001
From: Ines Montani <ines@ines.io>
Date: Fri, 6 Oct 2023 14:22:43 +0200
Subject: [PATCH 12/25] Inline displaCy visualizations in docs (#13050) [ci
 skip]

---
 .../images/displacy-long2.html                |   0
 website/docs/usage/101/_named-entities.mdx    |   8 +-
 website/docs/usage/101/_pos-deps.mdx          |   7 +-
 website/docs/usage/linguistic-features.mdx    |  15 +-
 website/docs/usage/rule-based-matching.mdx    |   7 +-
 website/docs/usage/saving-loading.mdx         |   8 +-
 website/docs/usage/v3-3.mdx                   |   8 +-
 website/docs/usage/visualizers.mdx            |  32 +--
 ...-founded.html => displacy-dep-founded.svg} |   0
 .../public/images/displacy-ent-custom.html    |  80 -------
 website/public/images/displacy-ent-snek.html  |  59 -----
 website/public/images/displacy-ent1.html      |  84 -------
 website/public/images/displacy-ent2.html      |  86 -------
 .../{displacy-long.html => displacy-long.svg} |   0
 website/public/images/displacy-long2.svg      | 212 ++++++++++++++++++
 .../public/images/displacy-span-custom.html   |  84 -------
 website/public/images/displacy-span.html      | 123 ----------
 website/src/components/embed.js               |  18 +-
 website/src/remark.js                         |   4 +-
 website/src/styles/embed.module.sass          |   8 +
 20 files changed, 273 insertions(+), 570 deletions(-)
 rename website/{public => docs}/images/displacy-long2.html (100%)
 rename website/public/images/{displacy-dep-founded.html => displacy-dep-founded.svg} (100%)
 delete mode 100644 website/public/images/displacy-ent-custom.html
 delete mode 100644 website/public/images/displacy-ent-snek.html
 delete mode 100644 website/public/images/displacy-ent1.html
 delete mode 100644 website/public/images/displacy-ent2.html
 rename website/public/images/{displacy-long.html => displacy-long.svg} (100%)
 create mode 100644 website/public/images/displacy-long2.svg
 delete mode 100644 website/public/images/displacy-span-custom.html
 delete mode 100644 website/public/images/displacy-span.html

diff --git a/website/public/images/displacy-long2.html b/website/docs/images/displacy-long2.html
similarity index 100%
rename from website/public/images/displacy-long2.html
rename to website/docs/images/displacy-long2.html
diff --git a/website/docs/usage/101/_named-entities.mdx b/website/docs/usage/101/_named-entities.mdx
index 9ae4134d8..da43c0ddd 100644
--- a/website/docs/usage/101/_named-entities.mdx
+++ b/website/docs/usage/101/_named-entities.mdx
@@ -31,8 +31,6 @@ for ent in doc.ents:
 Using spaCy's built-in [displaCy visualizer](/usage/visualizers), here's what
 our example sentence and its named entities look like:
 
-<Iframe
-  title="displaCy visualization of entities"
-  src="/images/displacy-ent1.html"
-  height={100}
-/>
+<Standalone height={120}>
+<div style={{lineHeight: 2.5, fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18}}><mark style={{ background: '#7aecec', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Apple <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark> is looking at buying <mark style={{ background: '#feca74', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>U.K. <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>GPE</span></mark> startup for <mark style={{ background: '#e4e7d2', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>$1 billion <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>MONEY</span></mark></div>
+</Standalone>
diff --git a/website/docs/usage/101/_pos-deps.mdx b/website/docs/usage/101/_pos-deps.mdx
index bedb6ce2c..db1e12885 100644
--- a/website/docs/usage/101/_pos-deps.mdx
+++ b/website/docs/usage/101/_pos-deps.mdx
@@ -56,8 +56,7 @@ for token in doc:
 Using spaCy's built-in [displaCy visualizer](/usage/visualizers), here's what
 our example sentence and its dependencies look like:
 
-<Iframe
-  title="displaCy visualization of dependencies and entities"
-  src="/images/displacy-long.html"
-  height={450}
+<ImageScrollable
+  src="/images/displacy-long.svg"
+  width={1975}
 />
diff --git a/website/docs/usage/linguistic-features.mdx b/website/docs/usage/linguistic-features.mdx
index a58e8a241..47259ce15 100644
--- a/website/docs/usage/linguistic-features.mdx
+++ b/website/docs/usage/linguistic-features.mdx
@@ -290,10 +290,9 @@ for token in doc:
 | toward        | `prep`     | shift     | `NOUN`   | manufacturers           |
 | manufacturers | `pobj`     | toward    | `ADP`    |                         |
 
-<Iframe
-  title="displaCy visualization of dependencies and entities 2"
-  src="/images/displacy-long2.html"
-  height={450}
+<ImageScrollable
+  src="/images/displacy-long2.svg"
+  width={1275}
 />
 
 Because the syntactic relations form a tree, every word has **exactly one
@@ -709,11 +708,9 @@ doc = nlp(text)
 displacy.serve(doc, style="ent")
 ```
 
-<Iframe
-  title="displaCy visualizer for entities"
-  src="/images/displacy-ent2.html"
-  height={180}
-/>
+<Standalone height={180}>
+<div style={{lineHeight: 2.5, fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18}}>When <mark style={{ background: '#aa9cfc', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Sebastian Thrun <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>PERSON</span></mark> started working on self-driving cars at <mark style={{ background: '#7aecec', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Google <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark> in <mark style={{ background: '#bfe1d9', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>2007 <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>DATE</span></mark>, few people outside of the company took him seriously.</div>
+</Standalone>
 
 ## Entity Linking {id="entity-linking"}
 
diff --git a/website/docs/usage/rule-based-matching.mdx b/website/docs/usage/rule-based-matching.mdx
index d01107ea2..e5b98da3a 100644
--- a/website/docs/usage/rule-based-matching.mdx
+++ b/website/docs/usage/rule-based-matching.mdx
@@ -1144,10 +1144,9 @@ relations and tokens we want to match:
 > displacy.serve(doc)
 > ```
 
-<Iframe
-  title="displaCy visualization of dependencies"
-  src="/images/displacy-dep-founded.html"
-  height={450}
+<ImageScrollable
+  src="/images/displacy-dep-founded.svg"
+  width={925}
 />
 
 The relations we're interested in are:
diff --git a/website/docs/usage/saving-loading.mdx b/website/docs/usage/saving-loading.mdx
index aad8ea353..26f59750b 100644
--- a/website/docs/usage/saving-loading.mdx
+++ b/website/docs/usage/saving-loading.mdx
@@ -586,11 +586,9 @@ After installing the package, the custom colors will be used when visualizing
 text with `displacy`. Whenever the label `SNEK` is assigned, it will be
 displayed in `#3dff74`.
 
-<Iframe
-  title="displaCy visualization of entities"
-  src="/images/displacy-ent-snek.html"
-  height={100}
-/>
+<Standalone height={100}>
+<div style={{lineHeight: 2.5, fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18}}>🌱🌿 <mark style={{ background: '#3dff74', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>🐍 <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>SNEK</span></mark> ____ 🌳🌲 ____ <mark style={{ background: '#cfc5ff', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>👨‍🌾 <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>HUMAN</span></mark> 🏘️</div>
+</Standalone>
 
 ## Saving, loading and distributing trained pipelines {id="models"}
 
diff --git a/website/docs/usage/v3-3.mdx b/website/docs/usage/v3-3.mdx
index d692475de..fd211e6d2 100644
--- a/website/docs/usage/v3-3.mdx
+++ b/website/docs/usage/v3-3.mdx
@@ -77,11 +77,9 @@ doc.spans["custom"] = [Span(doc, 3, 6, "ORG"), Span(doc, 5, 6, "GPE")]
 displacy.serve(doc, style="span", options={"spans_key": "custom"})
 ```
 
-<Iframe
-  title="displaCy visualizer for overlapping spans"
-  src="/images/displacy-span.html"
-  height={180}
-/>
+<Standalone height={100}>
+<div style={{ lineHeight: 2.5, direction: 'ltr', fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18 }}>Welcome to the <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>Bank<span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#7aecec', top: 40, height: 4, borderTopLeftRadius: 3, borderBottomLeftRadius: 3, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}><span style={{ background: '#7aecec', color: '#000', top: '-0.5em', padding: '2px 3px', position: 'absolute', fontSize: '0.6em', fontWeight: 'bold', lineHeight: 1, borderRadius: 3 }}>ORG</span></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>of <span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>China<span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#feca74', top: 57, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#feca74', top: 57, height: 4, borderTopLeftRadius: 3, borderBottomLeftRadius: 3, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}><span style={{ background: '#feca74', color: '#000', top: '-0.5em', padding: '2px 3px', position: 'absolute', fontSize: '0.6em', fontWeight: 'bold', lineHeight: 1, borderRadius: 3 }}>GPE</span></span></span>.</div>
+</Standalone>
 
 ## Additional features and improvements
 
diff --git a/website/docs/usage/visualizers.mdx b/website/docs/usage/visualizers.mdx
index e73c4a16a..2905ba2bd 100644
--- a/website/docs/usage/visualizers.mdx
+++ b/website/docs/usage/visualizers.mdx
@@ -119,11 +119,9 @@ doc = nlp(text)
 displacy.serve(doc, style="ent")
 ```
 
-<Iframe
-  title="displaCy visualizer for entities"
-  src="/images/displacy-ent2.html"
-  height={180}
-/>
+<Standalone height={180}>
+<div style={{lineHeight: 2.5, fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18}}>When <mark style={{ background: '#aa9cfc', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Sebastian Thrun <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>PERSON</span></mark> started working on self-driving cars at <mark style={{ background: '#7aecec', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Google <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark> in <mark style={{ background: '#bfe1d9', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>2007 <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>DATE</span></mark>, few people outside of the company took him seriously.</div>
+</Standalone>
 
 The entity visualizer lets you customize the following `options`:
 
@@ -148,11 +146,9 @@ use the `colors` setting to add your own colors for them.
 > displacy.serve(doc, style="ent", options=options)
 > ```
 
-<Iframe
-  title="displaCy visualizer for entities (custom styling)"
-  src="/images/displacy-ent-custom.html"
-  height={225}
-/>
+<Standalone height={225}>
+<div style={{lineHeight: 2.5, fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18}}>But <mark style={{ background: 'linear-gradient(90deg, #aa9cfc, #fc9ce7)', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Google <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark> is starting from behind. The company made a late push into hardware, and <mark style={{ background: 'linear-gradient(90deg, #aa9cfc, #fc9ce7)', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Apple <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark>’s Siri, available on iPhones, and <mark style={{ background: 'linear-gradient(90deg, #aa9cfc, #fc9ce7)', padding: '0.45em 0.6em', margin: '0 0.25em', lineHeight: 1, borderRadius: '0.35em'}}>Amazon <span style={{ fontSize: '0.8em', fontWeight: 'bold', lineHeight: 1, borderRadius: '0.35em', marginLeft: '0.5rem'}}>ORG</span></mark>’s Alexa software, which runs on its Echo and Dot devices, have clear leads in consumer adoption.</div>
+</Standalone>
 
 The above example uses a little trick: Since the background color values are
 added as the `background` style attribute, you can use any
@@ -197,11 +193,9 @@ doc.spans["sc"] = [
 displacy.serve(doc, style="span")
 ```
 
-<Iframe
-  title="displaCy visualizer for overlapping spans"
-  src="/images/displacy-span.html"
-  height={180}
-/>
+<Standalone height={100}>
+<div style={{ lineHeight: 2.5, direction: 'ltr', fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18 }}>Welcome to the <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>Bank<span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#7aecec', top: 40, height: 4, borderTopLeftRadius: 3, borderBottomLeftRadius: 3, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}><span style={{ background: '#7aecec', color: '#000', top: '-0.5em', padding: '2px 3px', position: 'absolute', fontSize: '0.6em', fontWeight: 'bold', lineHeight: 1, borderRadius: 3 }}>ORG</span></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>of <span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>China<span style={{ background: '#7aecec', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#feca74', top: 57, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#feca74', top: 57, height: 4, borderTopLeftRadius: 3, borderBottomLeftRadius: 3, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}><span style={{ background: '#feca74', color: '#000', top: '-0.5em', padding: '2px 3px', position: 'absolute', fontSize: '0.6em', fontWeight: 'bold', lineHeight: 1, borderRadius: 3 }}>GPE</span></span></span>.</div>
+</Standalone>
 
 The span visualizer lets you customize the following `options`:
 
@@ -223,11 +217,9 @@ specify which one displaCy should use with `spans_key` (`sc` is the default).
 > displacy.serve(doc, style="span", options=options)
 > ```
 
-<Iframe
-  title="displaCy visualizer for spans (custom spans_key)"
-  src="/images/displacy-span-custom.html"
-  height={225}
-/>
+<Standalone height={100}>
+<div style={{ lineHeight: 2.5, direction: 'ltr', fontFamily: "-apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif, 'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol'", fontSize: 18 }}>Welcome to the <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>Bank<span style={{ background: '#ddd', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span><span style={{ background: '#ddd', top: 40, height: 4, borderTopLeftRadius: 3, borderBottomLeftRadius: 3, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}><span style={{ background: '#ddd', color: '#000', top: '-0.5em', padding: '2px 3px', position: 'absolute', fontSize: '0.6em', fontWeight: 'bold', lineHeight: 1, borderRadius: 3 }}>BANK</span></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>of <span style={{ background: '#ddd', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span></span> <span style={{ fontWeight: 'bold', display: 'inline-block', position: 'relative'}}>China<span style={{ background: '#ddd', top: 40, height: 4, left: -1, width: 'calc(100% + 2px)', position: 'absolute' }}></span></span>.</div>
+</Standalone>
 
 ## Using displaCy in Jupyter notebooks {id="jupyter"}
 
diff --git a/website/public/images/displacy-dep-founded.html b/website/public/images/displacy-dep-founded.svg
similarity index 100%
rename from website/public/images/displacy-dep-founded.html
rename to website/public/images/displacy-dep-founded.svg
diff --git a/website/public/images/displacy-ent-custom.html b/website/public/images/displacy-ent-custom.html
deleted file mode 100644
index 5da472fdb..000000000
--- a/website/public/images/displacy-ent-custom.html
+++ /dev/null
@@ -1,80 +0,0 @@
-<div
-    class="entities"
-    style="
-        line-height: 2.5;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 18px;
-    "
-    >But
-    <mark
-        class="entity"
-        style="
-            background: linear-gradient(90deg, #aa9cfc, #fc9ce7);
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-        >Google
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >ORG</span
-        ></mark
-    >is starting from behind. The company made a late push into hardware, and
-    <mark
-        class="entity"
-        style="
-            background: linear-gradient(90deg, #aa9cfc, #fc9ce7);
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-        >Apple
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >ORG</span
-        ></mark
-    >’s Siri, available on iPhones, and
-    <mark
-        class="entity"
-        style="
-            background: linear-gradient(90deg, #aa9cfc, #fc9ce7);
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-        >Amazon
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >ORG</span
-        ></mark
-    >’s Alexa software, which runs on its Echo and Dot devices, have clear leads in consumer
-    adoption.</div
->
diff --git a/website/public/images/displacy-ent-snek.html b/website/public/images/displacy-ent-snek.html
deleted file mode 100644
index 6604d9b78..000000000
--- a/website/public/images/displacy-ent-snek.html
+++ /dev/null
@@ -1,59 +0,0 @@
-<div
-    class="entities"
-    style="
-        line-height: 2.5;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 16px;
-    "
->
-    🌱🌿
-    <mark
-        class="entity"
-        style="
-            background: #3dff74;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-        >🐍
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >SNEK</span
-        ></mark
-    >
-    ____ 🌳🌲 ____
-    <mark
-        class="entity"
-        style="
-            background: #cfc5ff;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-        >👨‍🌾
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >HUMAN</span
-        ></mark
-    >
-    🏘️
-</div>
diff --git a/website/public/images/displacy-ent1.html b/website/public/images/displacy-ent1.html
deleted file mode 100644
index 9fde5cf88..000000000
--- a/website/public/images/displacy-ent1.html
+++ /dev/null
@@ -1,84 +0,0 @@
-<div
-    class="entities"
-    style="
-        line-height: 2.5;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 16px;
-    "
->
-    <mark
-        class="entity"
-        style="
-            background: #7aecec;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        Apple
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >ORG</span
-        >
-    </mark>
-    is looking at buying
-    <mark
-        class="entity"
-        style="
-            background: #feca74;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        U.K.
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >GPE</span
-        >
-    </mark>
-    startup for
-    <mark
-        class="entity"
-        style="
-            background: #e4e7d2;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        $1 billion
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >MONEY</span
-        >
-    </mark>
-</div>
diff --git a/website/public/images/displacy-ent2.html b/website/public/images/displacy-ent2.html
deleted file mode 100644
index 01ab5c2bf..000000000
--- a/website/public/images/displacy-ent2.html
+++ /dev/null
@@ -1,86 +0,0 @@
-<div
-    class="entities"
-    style="
-        line-height: 2.5;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 18px;
-    "
->
-    When
-    <mark
-        class="entity"
-        style="
-            background: #aa9cfc;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        Sebastian Thrun
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >PERSON</span
-        >
-    </mark>
-    started working on self-driving cars at
-    <mark
-        class="entity"
-        style="
-            background: #7aecec;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        Google
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >ORG</span
-        >
-    </mark>
-    in
-    <mark
-        class="entity"
-        style="
-            background: #bfe1d9;
-            padding: 0.45em 0.6em;
-            margin: 0 0.25em;
-            line-height: 1;
-            border-radius: 0.35em;
-        "
-    >
-        2007
-        <span
-            style="
-                font-size: 0.8em;
-                font-weight: bold;
-                line-height: 1;
-                border-radius: 0.35em;
-                text-transform: uppercase;
-                vertical-align: middle;
-                margin-left: 0.5rem;
-            "
-            >DATE</span
-        >
-    </mark>
-    , few people outside of the company took him seriously.
-</div>
diff --git a/website/public/images/displacy-long.html b/website/public/images/displacy-long.svg
similarity index 100%
rename from website/public/images/displacy-long.html
rename to website/public/images/displacy-long.svg
diff --git a/website/public/images/displacy-long2.svg b/website/public/images/displacy-long2.svg
new file mode 100644
index 000000000..c428bd2cb
--- /dev/null
+++ b/website/public/images/displacy-long2.svg
@@ -0,0 +1,212 @@
+<svg
+    xmlns="http://www.w3.org/2000/svg"
+    xmlns:xlink="http://www.w3.org/1999/xlink"
+    id="0"
+    class="displacy"
+    width="1275"
+    height="399.5"
+    style="
+        max-width: none;
+        height: 399.5px;
+        color: #000000;
+        background: #ffffff;
+        font-family: Arial;
+    "
+>
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="50">Autonomous</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="50">ADJ</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="225">cars</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="225">NOUN</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="400">shift</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="400">VERB</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="575">insurance</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="575">NOUN</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="750">liability</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="750">NOUN</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="925">toward</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="925">ADP</tspan>
+    </text>
+
+    <text class="displacy-token" fill="currentColor" text-anchor="middle" y="309.5">
+        <tspan class="displacy-word" fill="currentColor" x="1100">manufacturers</tspan>
+        <tspan class="displacy-tag" dy="2em" fill="currentColor" x="1100">NOUN</tspan>
+    </text>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-0"
+            stroke-width="2px"
+            d="M70,264.5 C70,177.0 215.0,177.0 215.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-0"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                amod
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M70,266.5 L62,254.5 78,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-1"
+            stroke-width="2px"
+            d="M245,264.5 C245,177.0 390.0,177.0 390.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-1"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                nsubj
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M245,266.5 L237,254.5 253,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-2"
+            stroke-width="2px"
+            d="M595,264.5 C595,177.0 740.0,177.0 740.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-2"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                compound
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M595,266.5 L587,254.5 603,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-3"
+            stroke-width="2px"
+            d="M420,264.5 C420,89.5 745.0,89.5 745.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-3"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                dobj
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M745.0,266.5 L753.0,254.5 737.0,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-4"
+            stroke-width="2px"
+            d="M420,264.5 C420,2.0 925.0,2.0 925.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-4"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                prep
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M925.0,266.5 L933.0,254.5 917.0,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+
+    <g class="displacy-arrow">
+        <path
+            class="displacy-arc"
+            id="arrow-0-5"
+            stroke-width="2px"
+            d="M945,264.5 C945,177.0 1090.0,177.0 1090.0,264.5"
+            fill="none"
+            stroke="currentColor"
+        ></path>
+        <text dy="1.25em" style="font-size: 0.8em; letter-spacing: 1px">
+            <textPath
+                xlink:href="#arrow-0-5"
+                class="displacy-label"
+                startOffset="50%"
+                fill="currentColor"
+                text-anchor="middle"
+            >
+                pobj
+            </textPath>
+        </text>
+        <path
+            class="displacy-arrowhead"
+            d="M1090.0,266.5 L1098.0,254.5 1082.0,254.5"
+            fill="currentColor"
+        ></path>
+    </g>
+</svg>
diff --git a/website/public/images/displacy-span-custom.html b/website/public/images/displacy-span-custom.html
deleted file mode 100644
index 10cb6dd2d..000000000
--- a/website/public/images/displacy-span-custom.html
+++ /dev/null
@@ -1,84 +0,0 @@
-<div
-    class="spans"
-    style="
-        line-height: 2.5;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 18px;
-        direction: ltr;
-    "
->
-    Welcome to the
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        Bank
-        <span
-            style="
-                background: #ddd;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-        <span
-            style="
-                background: #ddd;
-                top: 40px;
-                height: 4px;
-                border-top-left-radius: 3px;
-                border-bottom-left-radius: 3px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-            <span
-                style="
-                    background: #ddd;
-                    color: #000;
-                    top: -0.5em;
-                    padding: 2px 3px;
-                    position: absolute;
-                    font-size: 0.6em;
-                    font-weight: bold;
-                    line-height: 1;
-                    border-radius: 3px;
-                "
-            >
-                BANK
-            </span>
-        </span>
-    </span>
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        of
-        <span
-            style="
-                background: #ddd;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-    </span>
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        China
-
-        <span
-            style="
-                background: #ddd;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-    </span>
-    .
-</div>
diff --git a/website/public/images/displacy-span.html b/website/public/images/displacy-span.html
deleted file mode 100644
index cfee1dc7e..000000000
--- a/website/public/images/displacy-span.html
+++ /dev/null
@@ -1,123 +0,0 @@
-<div
-    class="spans"
-    style="
-        line-height: 2.5;
-        direction: ltr;
-        font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Helvetica, Arial, sans-serif,
-            'Apple Color Emoji', 'Segoe UI Emoji', 'Segoe UI Symbol';
-        font-size: 18px;
-    "
->
-    Welcome to the
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        Bank
-        <span
-            style="
-                background: #7aecec;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-        <span
-            style="
-                background: #7aecec;
-                top: 40px;
-                height: 4px;
-                border-top-left-radius: 3px;
-                border-bottom-left-radius: 3px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-            <span
-                style="
-                    background: #7aecec;
-                    color: #000;
-                    top: -0.5em;
-                    padding: 2px 3px;
-                    position: absolute;
-                    font-size: 0.6em;
-                    font-weight: bold;
-                    line-height: 1;
-                    border-radius: 3px;
-                "
-            >
-                ORG
-            </span>
-        </span>
-    </span>
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        of
-
-        <span
-            style="
-                background: #7aecec;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-    </span>
-    <span style="font-weight: bold; display: inline-block; position: relative">
-        China
-        <span
-            style="
-                background: #7aecec;
-                top: 40px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-        <span
-            style="
-                background: #feca74;
-                top: 57px;
-                height: 4px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-        </span>
-        <span
-            style="
-                background: #feca74;
-                top: 57px;
-                height: 4px;
-                border-top-left-radius: 3px;
-                border-bottom-left-radius: 3px;
-                left: -1px;
-                width: calc(100% + 2px);
-                position: absolute;
-            "
-        >
-            <span
-                style="
-                    background: #feca74;
-                    color: #000;
-                    top: -0.5em;
-                    padding: 2px 3px;
-                    position: absolute;
-                    font-size: 0.6em;
-                    font-weight: bold;
-                    line-height: 1;
-                    border-radius: 3px;
-                "
-            >
-                GPE
-            </span>
-        </span>
-    </span>
-    .
-</div>
diff --git a/website/src/components/embed.js b/website/src/components/embed.js
index ad15a0b8b..5e92ca535 100644
--- a/website/src/components/embed.js
+++ b/website/src/components/embed.js
@@ -107,6 +107,22 @@ const Image = ({ src, alt, title, href, ...props }) => {
     )
 }
 
+const ImageScrollable = ({ src, alt, width, ...props }) => {
+    return (
+        <figure className={classNames(classes.standalone, classes.scrollable)}>
+            <img className={classes['image-scrollable']} src={src} alt={alt} width={width} height="auto" />
+        </figure>
+    )
+}
+
+const Standalone = ({ height, children, ...props }) => {
+    return (
+        <figure className={classes.standalone} style={{ height }}>
+            {children}
+        </figure>
+    )
+}
+
 const ImageFill = ({ image, ...props }) => {
     return (
         <span
@@ -137,4 +153,4 @@ const GoogleSheet = ({ id, link, height, button = 'View full table' }) => {
     )
 }
 
-export { YouTube, SoundCloud, Iframe, Image, ImageFill, GoogleSheet }
+export { YouTube, SoundCloud, Iframe, Image, ImageFill, ImageScrollable, GoogleSheet, Standalone }
diff --git a/website/src/remark.js b/website/src/remark.js
index 7e5499b01..be787eb84 100644
--- a/website/src/remark.js
+++ b/website/src/remark.js
@@ -13,7 +13,7 @@ import Aside from './components/aside'
 import Button from './components/button'
 import Tag from './components/tag'
 import Grid from './components/grid'
-import { YouTube, SoundCloud, Iframe, Image, GoogleSheet } from './components/embed'
+import { YouTube, SoundCloud, Iframe, Image, ImageScrollable, GoogleSheet, Standalone } from './components/embed'
 import Project from './widgets/project'
 import { Integration, IntegrationLogo } from './widgets/integration.js'
 import { Logos, Colors, Patterns } from './widgets/styleguide'
@@ -90,6 +90,8 @@ export const remarkComponents = {
      * For regular img elements it is not possible to pass properties
      */
     Image,
+    ImageScrollable,
+    Standalone,
 
     Label,
     Logos,
diff --git a/website/src/styles/embed.module.sass b/website/src/styles/embed.module.sass
index 82b7408ca..01814421f 100644
--- a/website/src/styles/embed.module.sass
+++ b/website/src/styles/embed.module.sass
@@ -26,12 +26,20 @@
     padding: var(--spacing-xs)
     margin-bottom: var(--spacing-md)
 
+.scrollable
+    max-width: 100%
+    overflow: auto
+
 .image
     position: relative
     display: block
     max-width: 100%
     margin: 0 auto
 
+.image-scrollable
+    display: block
+    max-width: fit-content
+
 .figure-fill
     display: block
     position: relative

From 65e7bd54f5d612aa0aeb4f6a4dd9595d73c012b0 Mon Sep 17 00:00:00 2001
From: Ines Montani <ines@ines.io>
Date: Fri, 6 Oct 2023 14:36:37 +0200
Subject: [PATCH 13/25] Update usage sidebar and nav alert [ci skip]

---
 website/meta/sidebars.json     | 9 ++-------
 website/src/templates/index.js | 4 ++--
 2 files changed, 4 insertions(+), 9 deletions(-)

diff --git a/website/meta/sidebars.json b/website/meta/sidebars.json
index 24213ed12..2df120ffa 100644
--- a/website/meta/sidebars.json
+++ b/website/meta/sidebars.json
@@ -9,14 +9,9 @@
                     { "text": "Models & Languages", "url": "/usage/models" },
                     { "text": "Facts & Figures", "url": "/usage/facts-figures" },
                     { "text": "spaCy 101", "url": "/usage/spacy-101" },
-                    { "text": "New in v3.0", "url": "/usage/v3" },
-                    { "text": "New in v3.1", "url": "/usage/v3-1" },
-                    { "text": "New in v3.2", "url": "/usage/v3-2" },
-                    { "text": "New in v3.3", "url": "/usage/v3-3" },
-                    { "text": "New in v3.4", "url": "/usage/v3-4" },
-                    { "text": "New in v3.5", "url": "/usage/v3-5" },
+                    { "text": "New in v3.7", "url": "/usage/v3-7" },
                     { "text": "New in v3.6", "url": "/usage/v3-6" },
-                    { "text": "New in v3.7", "url": "/usage/v3-7" }
+                    { "text": "New in v3.5", "url": "/usage/v3-5" }
                 ]
             },
             {
diff --git a/website/src/templates/index.js b/website/src/templates/index.js
index 1c969bd39..fad12f4c8 100644
--- a/website/src/templates/index.js
+++ b/website/src/templates/index.js
@@ -58,8 +58,8 @@ const AlertSpace = ({ nightly, legacy }) => {
 }
 
 const navAlert = (
-    <Link to="/usage/v3-7" noLinkLayout>
-        <strong>💥 Out now:</strong> spaCy v3.7
+    <Link to="https://form.typeform.com/to/WlflqP1b" noLinkLayout>
+        💥 Interested in <strong>Premium spaCy Models</strong>?
     </Link>
 )
 

From 77c568e5247bd0ff3744abce5c8541ecd7930524 Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Tue, 10 Oct 2023 15:35:25 +0200
Subject: [PATCH 14/25] Restore spacy.cli.project API (#13053)

* Restore spacy.cli.project API

* Fix typing errors, add simple import test
---
 spacy/cli/__init__.py               | 13 +++++++++++--
 spacy/cli/project/__init__.py       |  0
 spacy/cli/project/assets.py         |  1 +
 spacy/cli/project/clone.py          |  1 +
 spacy/cli/project/document.py       |  1 +
 spacy/cli/project/dvc.py            |  1 +
 spacy/cli/project/pull.py           |  1 +
 spacy/cli/project/push.py           |  1 +
 spacy/cli/project/remote_storage.py |  1 +
 spacy/cli/project/run.py            |  1 +
 spacy/tests/test_cli.py             |  5 +++++
 11 files changed, 24 insertions(+), 2 deletions(-)
 create mode 100644 spacy/cli/project/__init__.py
 create mode 100644 spacy/cli/project/assets.py
 create mode 100644 spacy/cli/project/clone.py
 create mode 100644 spacy/cli/project/document.py
 create mode 100644 spacy/cli/project/dvc.py
 create mode 100644 spacy/cli/project/pull.py
 create mode 100644 spacy/cli/project/push.py
 create mode 100644 spacy/cli/project/remote_storage.py
 create mode 100644 spacy/cli/project/run.py

diff --git a/spacy/cli/__init__.py b/spacy/cli/__init__.py
index f3c6dbfed..1d402ff0c 100644
--- a/spacy/cli/__init__.py
+++ b/spacy/cli/__init__.py
@@ -22,8 +22,17 @@ from .init_pipeline import init_pipeline_cli  # noqa: F401
 from .package import package  # noqa: F401
 from .pretrain import pretrain  # noqa: F401
 from .profile import profile  # noqa: F401
-from .train import train_cli  # noqa: F401
-from .validate import validate  # noqa: F401
+from .project.assets import project_assets  # type: ignore[attr-defined]  # noqa: F401
+from .project.clone import project_clone  # type: ignore[attr-defined]  # noqa: F401
+from .project.document import (  # type: ignore[attr-defined]  # noqa: F401
+    project_document,
+)
+from .project.dvc import project_update_dvc  # type: ignore[attr-defined]  # noqa: F401
+from .project.pull import project_pull  # type: ignore[attr-defined]  # noqa: F401
+from .project.push import project_push  # type: ignore[attr-defined]  # noqa: F401
+from .project.run import project_run  # type: ignore[attr-defined]  # noqa: F401
+from .train import train_cli  # type: ignore[attr-defined]  # noqa: F401
+from .validate import validate  # type: ignore[attr-defined]  # noqa: F401
 
 
 @app.command("link", no_args_is_help=True, deprecated=True, hidden=True)
diff --git a/spacy/cli/project/__init__.py b/spacy/cli/project/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/spacy/cli/project/assets.py b/spacy/cli/project/assets.py
new file mode 100644
index 000000000..591d1959e
--- /dev/null
+++ b/spacy/cli/project/assets.py
@@ -0,0 +1 @@
+from weasel.cli.assets import *
diff --git a/spacy/cli/project/clone.py b/spacy/cli/project/clone.py
new file mode 100644
index 000000000..11d2511a3
--- /dev/null
+++ b/spacy/cli/project/clone.py
@@ -0,0 +1 @@
+from weasel.cli.clone import *
diff --git a/spacy/cli/project/document.py b/spacy/cli/project/document.py
new file mode 100644
index 000000000..1952524a9
--- /dev/null
+++ b/spacy/cli/project/document.py
@@ -0,0 +1 @@
+from weasel.cli.document import *
diff --git a/spacy/cli/project/dvc.py b/spacy/cli/project/dvc.py
new file mode 100644
index 000000000..aa1ae7dd9
--- /dev/null
+++ b/spacy/cli/project/dvc.py
@@ -0,0 +1 @@
+from weasel.cli.dvc import *
diff --git a/spacy/cli/project/pull.py b/spacy/cli/project/pull.py
new file mode 100644
index 000000000..5e603273d
--- /dev/null
+++ b/spacy/cli/project/pull.py
@@ -0,0 +1 @@
+from weasel.cli.pull import *
diff --git a/spacy/cli/project/push.py b/spacy/cli/project/push.py
new file mode 100644
index 000000000..3a8e8869d
--- /dev/null
+++ b/spacy/cli/project/push.py
@@ -0,0 +1 @@
+from weasel.cli.push import *
diff --git a/spacy/cli/project/remote_storage.py b/spacy/cli/project/remote_storage.py
new file mode 100644
index 000000000..29409150f
--- /dev/null
+++ b/spacy/cli/project/remote_storage.py
@@ -0,0 +1 @@
+from weasel.cli.remote_storage import *
diff --git a/spacy/cli/project/run.py b/spacy/cli/project/run.py
new file mode 100644
index 000000000..cc6a5ac42
--- /dev/null
+++ b/spacy/cli/project/run.py
@@ -0,0 +1 @@
+from weasel.cli.run import *
diff --git a/spacy/tests/test_cli.py b/spacy/tests/test_cli.py
index 86451317b..ff53ed1e1 100644
--- a/spacy/tests/test_cli.py
+++ b/spacy/tests/test_cli.py
@@ -1061,3 +1061,8 @@ def test_debug_data_trainable_lemmatizer_not_annotated():
 
     data = _compile_gold(train_examples, ["trainable_lemmatizer"], nlp, True)
     assert data["no_lemma_annotations"] == 2
+
+
+def test_project_api_imports():
+    from spacy.cli import project_run
+    from spacy.cli.project.run import project_run  # noqa: F401, F811

From d72029d9c88f479da1b1866ab9998f3427821e2e Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Wed, 11 Oct 2023 12:23:38 +0200
Subject: [PATCH 15/25] Add binary examples for Textcat task in `spacy-llm`
 (#13051)

* Add examples for binary classification.

* Fix example.

* Remove binary textcat example. Format.

* Rephrase.
---
 website/docs/api/large-language-models.mdx | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index f8404cb2e..55d137e21 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -752,6 +752,25 @@ supports `.yml`, `.yaml`, `.json` and `.jsonl`.
 path = "textcat_examples.json"
 ```
 
+If you want to perform few-shot learning with a binary classifier (i.e. a text
+either should or should not be assigned to a given class), you can provide
+positive and negative examples with answers of "POS" or "NEG". "POS" means that
+this example should be assigned the class label defined in the configuration;
+"NEG" means it shouldn't. For example, for spam classification:
+
+```json
+[
+  {
+    "text": "You won the lottery! Wire a fee of 200$ to be able to withdraw your winnings.",
+    "answer": "POS"
+  },
+  {
+    "text": "Your order #123456789 has arrived",
+    "answer": "NEG"
+  }
+]
+```
+
 ### REL {id="rel"}
 
 The REL task extracts relations between named entities.

From ea1befa8ff5dc8e93c5ee4fd824a16b1c0d8534c Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Thu, 12 Oct 2023 11:53:33 +0200
Subject: [PATCH 16/25] Support Any comparisons for Token and Span (#13058)

* Support Any comparisons for Token and Span

* Preserve previous behavior for None
---
 spacy/tests/doc/test_span.py      | 9 +++++++++
 spacy/tests/doc/test_token_api.py | 9 +++++++++
 spacy/tokens/span.pyx             | 7 +++++--
 spacy/tokens/token.pyi            | 7 ++++++-
 spacy/tokens/token.pyx            | 9 ++++++---
 5 files changed, 35 insertions(+), 6 deletions(-)

diff --git a/spacy/tests/doc/test_span.py b/spacy/tests/doc/test_span.py
index 04dde2bfa..98a74bc21 100644
--- a/spacy/tests/doc/test_span.py
+++ b/spacy/tests/doc/test_span.py
@@ -731,3 +731,12 @@ def test_for_no_ent_sents():
     sents = list(doc.ents[0].sents)
     assert len(sents) == 1
     assert str(sents[0]) == str(doc.ents[0].sent) == "ENTITY"
+
+
+def test_span_api_richcmp_other(en_tokenizer):
+    doc1 = en_tokenizer("a b")
+    doc2 = en_tokenizer("b c")
+    assert not doc1[1:2] == doc1[1]
+    assert not doc1[1:2] == doc2[0]
+    assert not doc1[1:2] == doc2[0:1]
+    assert not doc1[0:1] == doc2
diff --git a/spacy/tests/doc/test_token_api.py b/spacy/tests/doc/test_token_api.py
index 782dfd774..c10221e65 100644
--- a/spacy/tests/doc/test_token_api.py
+++ b/spacy/tests/doc/test_token_api.py
@@ -294,3 +294,12 @@ def test_missing_head_dep(en_vocab):
     assert aligned_heads[0] == ref_heads[0]
     assert aligned_deps[5] == ref_deps[5]
     assert aligned_heads[5] == ref_heads[5]
+
+
+def test_token_api_richcmp_other(en_tokenizer):
+    doc1 = en_tokenizer("a b")
+    doc2 = en_tokenizer("b c")
+    assert not doc1[1] == doc1[0:1]
+    assert not doc1[1] == doc2[1:2]
+    assert not doc1[1] == doc2[0]
+    assert not doc1[0] == doc2
diff --git a/spacy/tokens/span.pyx b/spacy/tokens/span.pyx
index af3ba8db5..e179bbce7 100644
--- a/spacy/tokens/span.pyx
+++ b/spacy/tokens/span.pyx
@@ -127,14 +127,17 @@ cdef class Span:
         self._vector = vector
         self._vector_norm = vector_norm
 
-    def __richcmp__(self, Span other, int op):
+    def __richcmp__(self, object other, int op):
         if other is None:
             if op == 0 or op == 1 or op == 2:
                 return False
             else:
                 return True
+        if not isinstance(other, Span):
+            return False
+        cdef Span other_span = other
         self_tuple = (self.c.start_char, self.c.end_char, self.c.label, self.c.kb_id, self.id, self.doc)
-        other_tuple = (other.c.start_char, other.c.end_char, other.c.label, other.c.kb_id, other.id, other.doc)
+        other_tuple = (other_span.c.start_char, other_span.c.end_char, other_span.c.label, other_span.c.kb_id, other_span.id, other_span.doc)
         # <
         if op == 0:
             return self_tuple < other_tuple
diff --git a/spacy/tokens/token.pyi b/spacy/tokens/token.pyi
index e7863fd16..435ace527 100644
--- a/spacy/tokens/token.pyi
+++ b/spacy/tokens/token.pyi
@@ -53,7 +53,12 @@ class Token:
     def __bytes__(self) -> bytes: ...
     def __str__(self) -> str: ...
     def __repr__(self) -> str: ...
-    def __richcmp__(self, other: Token, op: int) -> bool: ...
+    def __lt__(self, other: Any) -> bool: ...
+    def __le__(self, other: Any) -> bool: ...
+    def __eq__(self, other: Any) -> bool: ...
+    def __ne__(self, other: Any) -> bool: ...
+    def __gt__(self, other: Any) -> bool: ...
+    def __ge__(self, other: Any) -> bool: ...
     @property
     def _(self) -> Underscore: ...
     def nbor(self, i: int = ...) -> Token: ...
diff --git a/spacy/tokens/token.pyx b/spacy/tokens/token.pyx
index 9fd4118d6..2ed736b70 100644
--- a/spacy/tokens/token.pyx
+++ b/spacy/tokens/token.pyx
@@ -139,17 +139,20 @@ cdef class Token:
     def __repr__(self):
         return self.__str__()
 
-    def __richcmp__(self, Token other, int op):
+    def __richcmp__(self, object other, int op):
         # http://cython.readthedocs.io/en/latest/src/userguide/special_methods.html
         if other is None:
             if op in (0, 1, 2):
                 return False
             else:
                 return True
+        if not isinstance(other, Token):
+            return False
+        cdef Token other_token = other
         cdef Doc my_doc = self.doc
-        cdef Doc other_doc = other.doc
+        cdef Doc other_doc = other_token.doc
         my = self.idx
-        their = other.idx
+        their = other_token.idx
         if op == 0:
             return my < their
         elif op == 2:

From 699dd8b3b7a21dfdc71c740de7096f5d9cb5d646 Mon Sep 17 00:00:00 2001
From: Sofie Van Landeghem <svlandeg@users.noreply.github.com>
Date: Mon, 16 Oct 2023 10:17:47 +0200
Subject: [PATCH 17/25] Update __all__ fields (#13063)

* update all for pipeline.init

* add all in training.init

* add all in kb.init

* alphabetically
---
 spacy/kb/__init__.py       |  8 ++++++++
 spacy/matcher/__init__.py  |  2 +-
 spacy/pipeline/__init__.py |  1 +
 spacy/tokens/__init__.py   |  2 +-
 spacy/training/__init__.py | 25 +++++++++++++++++++++++++
 5 files changed, 36 insertions(+), 2 deletions(-)

diff --git a/spacy/kb/__init__.py b/spacy/kb/__init__.py
index 3ce3e4c33..93a65ab61 100644
--- a/spacy/kb/__init__.py
+++ b/spacy/kb/__init__.py
@@ -1,3 +1,11 @@
 from .candidate import Candidate, get_candidates, get_candidates_batch
 from .kb import KnowledgeBase
 from .kb_in_memory import InMemoryLookupKB
+
+__all__ = [
+    "Candidate",
+    "KnowledgeBase",
+    "InMemoryLookupKB",
+    "get_candidates",
+    "get_candidates_batch",
+]
diff --git a/spacy/matcher/__init__.py b/spacy/matcher/__init__.py
index f671f2e35..b6d6d70ab 100644
--- a/spacy/matcher/__init__.py
+++ b/spacy/matcher/__init__.py
@@ -3,4 +3,4 @@ from .levenshtein import levenshtein
 from .matcher import Matcher
 from .phrasematcher import PhraseMatcher
 
-__all__ = ["Matcher", "PhraseMatcher", "DependencyMatcher", "levenshtein"]
+__all__ = ["DependencyMatcher", "Matcher", "PhraseMatcher", "levenshtein"]
diff --git a/spacy/pipeline/__init__.py b/spacy/pipeline/__init__.py
index 40e3fd638..2c4a5a8a8 100644
--- a/spacy/pipeline/__init__.py
+++ b/spacy/pipeline/__init__.py
@@ -22,6 +22,7 @@ from .trainable_pipe import TrainablePipe
 __all__ = [
     "AttributeRuler",
     "DependencyParser",
+    "EditTreeLemmatizer",
     "EntityLinker",
     "EntityRecognizer",
     "EntityRuler",
diff --git a/spacy/tokens/__init__.py b/spacy/tokens/__init__.py
index f4b2bf022..3393ca6ec 100644
--- a/spacy/tokens/__init__.py
+++ b/spacy/tokens/__init__.py
@@ -5,4 +5,4 @@ from .span import Span
 from .span_group import SpanGroup
 from .token import Token
 
-__all__ = ["Doc", "Token", "Span", "SpanGroup", "DocBin", "MorphAnalysis"]
+__all__ = ["Doc", "DocBin", "MorphAnalysis", "Span", "SpanGroup", "Token"]
diff --git a/spacy/training/__init__.py b/spacy/training/__init__.py
index b8c0792f0..5c2ba9932 100644
--- a/spacy/training/__init__.py
+++ b/spacy/training/__init__.py
@@ -16,3 +16,28 @@ from .iob_utils import (  # noqa: F401
     tags_to_entities,
 )
 from .loggers import console_logger  # noqa: F401
+
+__all__ = [
+    "Alignment",
+    "Corpus",
+    "Example",
+    "JsonlCorpus",
+    "PlainTextCorpus",
+    "biluo_tags_to_offsets",
+    "biluo_tags_to_spans",
+    "biluo_to_iob",
+    "create_copy_from_base_model",
+    "docs_to_json",
+    "dont_augment",
+    "iob_to_biluo",
+    "minibatch_by_padded_size",
+    "minibatch_by_words",
+    "offsets_to_biluo_tags",
+    "orth_variants_augmenter",
+    "read_json_file",
+    "remove_bilu_prefix",
+    "split_bilu_label",
+    "tags_to_entities",
+    "validate_get_examples",
+    "validate_examples",
+]

From a89eae928340f66c954345c56346475f6597e786 Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Mon, 16 Oct 2023 15:10:55 +0200
Subject: [PATCH 18/25] Set version to v3.7.2 (#13066)

---
 spacy/about.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/spacy/about.py b/spacy/about.py
index 0e718400b..9da0b6d74 100644
--- a/spacy/about.py
+++ b/spacy/about.py
@@ -1,5 +1,5 @@
 # fmt: off
 __title__ = "spacy"
-__version__ = "3.7.1"
+__version__ = "3.7.2"
 __download_url__ = "https://github.com/explosion/spacy-models/releases/download"
 __compatibility__ = "https://raw.githubusercontent.com/explosion/spacy-models/master/compatibility.json"

From d717123819fb02cf81dcc26be305c0f9cd9893bf Mon Sep 17 00:00:00 2001
From: Sofie Van Landeghem <svlandeg@users.noreply.github.com>
Date: Mon, 23 Oct 2023 11:59:18 +0200
Subject: [PATCH 19/25] Update LICENSE (#13078)

---
 LICENSE | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/LICENSE b/LICENSE
index d76864579..979f5ade7 100644
--- a/LICENSE
+++ b/LICENSE
@@ -1,6 +1,6 @@
 The MIT License (MIT)
 
-Copyright (C) 2016-2022 ExplosionAI GmbH, 2016 spaCy GmbH, 2015 Matthew Honnibal
+Copyright (C) 2016-2023 ExplosionAI GmbH, 2016 spaCy GmbH, 2015 Matthew Honnibal
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

From 9deaac9786a8dd47aa246ba3ef53dc5924d646ab Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Mon, 30 Oct 2023 17:02:08 +0100
Subject: [PATCH 20/25] Add note in docs on `score_weight` config if using a
 non-default `spans_key` for SpanCat (#13093)

* Add note on score_weight if using a non-default span_key for SpanCat.

* Fix formatting.

* Fix formatting.

* Fix typo.

* Use warning infobox.

* Fix infobox formatting.
---
 website/docs/api/spancategorizer.mdx | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/website/docs/api/spancategorizer.mdx b/website/docs/api/spancategorizer.mdx
index bfe33dfb9..8c8a71256 100644
--- a/website/docs/api/spancategorizer.mdx
+++ b/website/docs/api/spancategorizer.mdx
@@ -89,6 +89,20 @@ architectures and their arguments and hyperparameters.
 | `negative_weight` <Tag variant="new">3.5.1</Tag>    | Multiplier for the loss terms. It can be used to downweight the negative samples if there are too many. It is only used when `add_negative_label` is `True`. Defaults to `1.0`. ~~float~~                                                                                                               |
 | `allow_overlap` <Tag variant="new">3.5.1</Tag>      | If `True`, the data is assumed to contain overlapping spans. It is only available when `max_positive` is exactly 1. Defaults to `True`. ~~bool~~                                                                                                                                                        |
 
+<Infobox variant="warning">
+
+If you set a non-default value for `spans_key`, you'll have to update
+`[training.score_weights]` as well so that weights are computed properly. E. g. for `span_key == "myspankey"`, include this in your config:
+
+```ini
+[training.score_weights]
+spans_myspankey_f = 1.0
+spans_myspankey_p = 0.0
+spans_myspankey_r = 0.0
+```
+
+</Infobox>
+
 ```python
 %%GITHUB_SPACY/spacy/pipeline/spancat.py
 ```

From 0c158765024aac04088af8c3ae77650df5a79a3d Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Tue, 31 Oct 2023 13:45:10 +0100
Subject: [PATCH 21/25] Fix spancat typo. (#13095)

---
 website/docs/api/spancategorizer.mdx | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/website/docs/api/spancategorizer.mdx b/website/docs/api/spancategorizer.mdx
index 8c8a71256..98a1948ee 100644
--- a/website/docs/api/spancategorizer.mdx
+++ b/website/docs/api/spancategorizer.mdx
@@ -92,7 +92,8 @@ architectures and their arguments and hyperparameters.
 <Infobox variant="warning">
 
 If you set a non-default value for `spans_key`, you'll have to update
-`[training.score_weights]` as well so that weights are computed properly. E. g. for `span_key == "myspankey"`, include this in your config:
+`[training.score_weights]` as well so that weights are computed properly. E. g.
+for `spans_key == "myspankey"`, include this in your config:
 
 ```ini
 [training.score_weights]

From 48248c62b6190a833d3cc4557e40497f1a5a1eff Mon Sep 17 00:00:00 2001
From: Sofie Van Landeghem <svlandeg@users.noreply.github.com>
Date: Tue, 31 Oct 2023 21:58:29 +0100
Subject: [PATCH 22/25] Clarify EL example in docs (#13071)

* add comment that pipeline is a custom one

* add link to NEL tutorial

* prettier

* revert prettier reformat

* revert prettier reformat (2)

* fix typo

Co-authored-by: Raphael Mitsch <r.mitsch@outlook.com>

---------

Co-authored-by: Raphael Mitsch <r.mitsch@outlook.com>
---
 website/docs/usage/linguistic-features.mdx | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/website/docs/usage/linguistic-features.mdx b/website/docs/usage/linguistic-features.mdx
index 47259ce15..21cedd1ef 100644
--- a/website/docs/usage/linguistic-features.mdx
+++ b/website/docs/usage/linguistic-features.mdx
@@ -290,10 +290,7 @@ for token in doc:
 | toward        | `prep`     | shift     | `NOUN`   | manufacturers           |
 | manufacturers | `pobj`     | toward    | `ADP`    |                         |
 
-<ImageScrollable
-  src="/images/displacy-long2.svg"
-  width={1275}
-/>
+<ImageScrollable src="/images/displacy-long2.svg" width={1275} />
 
 Because the syntactic relations form a tree, every word has **exactly one
 head**. You can therefore iterate over the arcs in the tree by iterating over
@@ -720,6 +717,10 @@ identifier from a knowledge base (KB). You can create your own
 [`KnowledgeBase`](/api/kb) and [train](/usage/training) a new
 [`EntityLinker`](/api/entitylinker) using that custom knowledge base.
 
+For an example of how to define a KnowledgeBase and train an entity linker model,
+see [this tutorial](https://github.com/explosion/projects/blob/v3/tutorials/nel_emerson)
+using [spaCy projects](/usage/projects).
+
 ### Accessing entity identifiers {id="entity-linking-accessing",model="entity linking"}
 
 The annotated KB identifier is accessible as either a hash value or as a string,
@@ -730,6 +731,7 @@ object, or the `ent_kb_id` and `ent_kb_id_` attributes of a
 ```python
 import spacy
 
+# "my_custom_el_pipeline" is assumed to be a custom NLP pipeline that was trained and serialized to disk
 nlp = spacy.load("my_custom_el_pipeline")
 doc = nlp("Ada Lovelace was born in London")
 

From a804b83a4bb8cbe1c49ba529ad1d54d6f32de3a5 Mon Sep 17 00:00:00 2001
From: Sofie Van Landeghem <svlandeg@users.noreply.github.com>
Date: Tue, 31 Oct 2023 22:07:07 +0100
Subject: [PATCH 23/25] Update llm docs to clarify task-specific factories
 (#13082)

* fix typo

* add examples to specify custom model for task-specific factory
---
 website/docs/api/large-language-models.mdx | 23 +++++++++++++---------
 1 file changed, 14 insertions(+), 9 deletions(-)

diff --git a/website/docs/api/large-language-models.mdx b/website/docs/api/large-language-models.mdx
index 55d137e21..5739a6c2f 100644
--- a/website/docs/api/large-language-models.mdx
+++ b/website/docs/api/large-language-models.mdx
@@ -16,14 +16,6 @@ prototyping** and **prompting**, and turning unstructured responses into
 
 ## Config and implementation {id="config"}
 
-An LLM component is implemented through the `LLMWrapper` class. It is accessible
-through a generic `llm`
-[component factory](https://spacy.io/usage/processing-pipelines#custom-components-factories)
-as well as through task-specific component factories: `llm_ner`, `llm_spancat`,
-`llm_rel`, `llm_textcat`, `llm_sentiment` and `llm_summarization`.
-
-### LLMWrapper.\_\_init\_\_ {id="init",tag="method"}
-
 > #### Example
 >
 > ```python
@@ -32,13 +24,26 @@ as well as through task-specific component factories: `llm_ner`, `llm_spancat`,
 > llm = nlp.add_pipe("llm", config=config)
 >
 > # Construction via add_pipe with a task-specific factory and default GPT3.5 model
-> llm = nlp.add_pipe("llm-ner")
+> llm = nlp.add_pipe("llm_ner")
+>
+> # Construction via add_pipe with a task-specific factory and custom model
+> llm = nlp.add_pipe("llm_ner", config={"model": {"@llm_models": "spacy.Dolly.v1", "name": "dolly-v2-12b"}})
 >
 > # Construction from class
 > from spacy_llm.pipeline import LLMWrapper
 > llm = LLMWrapper(vocab=nlp.vocab, task=task, model=model, cache=cache, save_io=True)
 > ```
 
+An LLM component is implemented through the `LLMWrapper` class. It is accessible
+through a generic `llm`
+[component factory](https://spacy.io/usage/processing-pipelines#custom-components-factories)
+as well as through task-specific component factories: `llm_ner`, `llm_spancat`,
+`llm_rel`, `llm_textcat`, `llm_sentiment` and `llm_summarization`. For these
+factories, the GPT-3.5 model from OpenAI is used by default, but this can be
+customized.
+
+### LLMWrapper.\_\_init\_\_ {id="init",tag="method"}
+
 Create a new pipeline instance. In your application, you would normally use a
 shortcut for this and instantiate the component using its string name and
 [`nlp.add_pipe`](/api/language#add_pipe).

From c4e2daf6ef24a280e3c252e62a8534110c417ce8 Mon Sep 17 00:00:00 2001
From: Raphael Mitsch <r.mitsch@outlook.com>
Date: Thu, 2 Nov 2023 12:02:18 +0100
Subject: [PATCH 24/25] Fix displacy span stacking (#13068)

* Fix displacy span stacking.

* Format. Remove counter.

* Remove test files.

* Add unit test. Refactor to allow for unit test.

* Fix off-by-one error in tests.
---
 spacy/displacy/render.py     | 39 +++++++++++++++++++++++++++---------
 spacy/tests/test_displacy.py | 22 +++++++++++++++++++-
 2 files changed, 51 insertions(+), 10 deletions(-)

diff --git a/spacy/displacy/render.py b/spacy/displacy/render.py
index 2ab41ccc2..40b9986e8 100644
--- a/spacy/displacy/render.py
+++ b/spacy/displacy/render.py
@@ -142,7 +142,25 @@ class SpanRenderer:
         spans (list): Individual entity spans and their start, end, label, kb_id and kb_url.
         title (str / None): Document title set in Doc.user_data['title'].
         """
-        per_token_info = []
+        per_token_info = self._assemble_per_token_info(tokens, spans)
+        markup = self._render_markup(per_token_info)
+        markup = TPL_SPANS.format(content=markup, dir=self.direction)
+        if title:
+            markup = TPL_TITLE.format(title=title) + markup
+        return markup
+
+    @staticmethod
+    def _assemble_per_token_info(
+        tokens: List[str], spans: List[Dict[str, Any]]
+    ) -> List[Dict[str, List[Dict[str, Any]]]]:
+        """Assembles token info used to generate markup in render_spans().
+        tokens (List[str]): Tokens in text.
+        spans (List[Dict[str, Any]]): Spans in text.
+        RETURNS (List[Dict[str, List[Dict[str, Any]]]]): Per token info needed to render HTML markup for given tokens
+            and spans.
+        """
+        per_token_info: List[Dict[str, List[Dict[str, Any]]]] = []
+
         # we must sort so that we can correctly describe when spans need to "stack"
         # which is determined by their start token, then span length (longer spans on top),
         # then break any remaining ties with the span label
@@ -154,21 +172,22 @@ class SpanRenderer:
                 s["label"],
             ),
         )
+
         for s in spans:
             # this is the vertical 'slot' that the span will be rendered in
             # vertical_position = span_label_offset + (offset_step * (slot - 1))
             s["render_slot"] = 0
+
         for idx, token in enumerate(tokens):
             # Identify if a token belongs to a Span (and which) and if it's a
             # start token of said Span. We'll use this for the final HTML render
             token_markup: Dict[str, Any] = {}
             token_markup["text"] = token
-            concurrent_spans = 0
+            intersecting_spans: List[Dict[str, Any]] = []
             entities = []
             for span in spans:
                 ent = {}
                 if span["start_token"] <= idx < span["end_token"]:
-                    concurrent_spans += 1
                     span_start = idx == span["start_token"]
                     ent["label"] = span["label"]
                     ent["is_start"] = span_start
@@ -176,7 +195,12 @@ class SpanRenderer:
                         # When the span starts, we need to know how many other
                         # spans are on the 'span stack' and will be rendered.
                         # This value becomes the vertical render slot for this entire span
-                        span["render_slot"] = concurrent_spans
+                        span["render_slot"] = (
+                            intersecting_spans[-1]["render_slot"]
+                            if len(intersecting_spans)
+                            else 0
+                        ) + 1
+                    intersecting_spans.append(span)
                     ent["render_slot"] = span["render_slot"]
                     kb_id = span.get("kb_id", "")
                     kb_url = span.get("kb_url", "#")
@@ -193,11 +217,8 @@ class SpanRenderer:
                     span["render_slot"] = 0
             token_markup["entities"] = entities
             per_token_info.append(token_markup)
-        markup = self._render_markup(per_token_info)
-        markup = TPL_SPANS.format(content=markup, dir=self.direction)
-        if title:
-            markup = TPL_TITLE.format(title=title) + markup
-        return markup
+
+        return per_token_info
 
     def _render_markup(self, per_token_info: List[Dict[str, Any]]) -> str:
         """Render the markup from per-token information"""
diff --git a/spacy/tests/test_displacy.py b/spacy/tests/test_displacy.py
index 12d903dca..b83c7db07 100644
--- a/spacy/tests/test_displacy.py
+++ b/spacy/tests/test_displacy.py
@@ -2,7 +2,7 @@ import numpy
 import pytest
 
 from spacy import displacy
-from spacy.displacy.render import DependencyRenderer, EntityRenderer
+from spacy.displacy.render import DependencyRenderer, EntityRenderer, SpanRenderer
 from spacy.lang.en import English
 from spacy.lang.fa import Persian
 from spacy.tokens import Doc, Span
@@ -468,3 +468,23 @@ def test_issue12816(en_vocab) -> None:
     # Verify that the HTML tag is still escaped
     html = displacy.render(doc, style="span")
     assert "&lt;TEST&gt;" in html
+
+
+@pytest.mark.issue(13056)
+def test_displacy_span_stacking():
+    """Test whether span stacking works properly for multiple overlapping spans."""
+    spans = [
+        {"start_token": 2, "end_token": 5, "label": "SkillNC"},
+        {"start_token": 0, "end_token": 2, "label": "Skill"},
+        {"start_token": 1, "end_token": 3, "label": "Skill"},
+    ]
+    tokens = ["Welcome", "to", "the", "Bank", "of", "China", "."]
+    per_token_info = SpanRenderer._assemble_per_token_info(spans=spans, tokens=tokens)
+
+    assert len(per_token_info) == len(tokens)
+    assert all([len(per_token_info[i]["entities"]) == 1 for i in (0, 3, 4)])
+    assert all([len(per_token_info[i]["entities"]) == 2 for i in (1, 2)])
+    assert per_token_info[1]["entities"][0]["render_slot"] == 1
+    assert per_token_info[1]["entities"][1]["render_slot"] == 2
+    assert per_token_info[2]["entities"][0]["render_slot"] == 2
+    assert per_token_info[2]["entities"][1]["render_slot"] == 3

From 92f1d0a195ed96706f548ef16cfda5ef5226bb07 Mon Sep 17 00:00:00 2001
From: Adriane Boyd <adrianeboyd@gmail.com>
Date: Fri, 3 Nov 2023 15:46:03 +0100
Subject: [PATCH 25/25] CI: Switch to stable python 3.12 and limit 3.11 runs
 (#13104)

---
 .github/workflows/tests.yml | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index 976b1f4f2..840b8e5f9 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -58,7 +58,7 @@ jobs:
       fail-fast: true
       matrix:
         os: [ubuntu-latest, windows-latest, macos-latest]
-        python_version: ["3.11", "3.12.0-rc.2"]
+        python_version: ["3.12"]
         include:
           - os: windows-latest
             python_version: "3.7"
@@ -68,6 +68,8 @@ jobs:
             python_version: "3.9"
           - os: windows-latest
             python_version: "3.10"
+          - os: macos-latest
+            python_version: "3.11"
 
     runs-on: ${{ matrix.os }}