fix BertWordPieceTokenizer constructor call

This commit is contained in:
svlandeg 2023-09-05 13:24:17 +02:00
parent 6d1f6d9a23
commit 3bc564c28e

View File

@@ -1301,7 +1301,7 @@ correct type.
@spacy.registry.tokenizers("bert_word_piece_tokenizer")
def create_whitespace_tokenizer(vocab_file: str, lowercase: bool):
def create_tokenizer(nlp):
- return BertWordPieceTokenizer(nlp.vocab, vocab_file, lowercase)
+ return BertWordPieceTokenizer(vocab_file, lowercase=lowercase)
return create_tokenizer
```