diff --git a/website/docs/usage/linguistic-features.mdx b/website/docs/usage/linguistic-features.mdx
index 6c84762f6..2d5fb2b67 100644
--- a/website/docs/usage/linguistic-features.mdx
+++ b/website/docs/usage/linguistic-features.mdx
@@ -1301,7 +1301,7 @@ correct type.
 @spacy.registry.tokenizers("bert_word_piece_tokenizer")
 def create_whitespace_tokenizer(vocab_file: str, lowercase: bool):
     def create_tokenizer(nlp):
-        return BertWordPieceTokenizer(vocab_file, lowercase=lowercase)
+        return BertTokenizer(nlp.vocab, vocab_file, lowercase)
 
     return create_tokenizer
 ```