mirror of
https://github.com/explosion/spaCy.git
synced 2025-04-22 01:51:58 +03:00
fix token len
This commit is contained in:
parent
86d78d9730
commit
82ce3cc3f0
|
@@ -61,7 +61,7 @@ def test_ms_tokenizer_splits_uneven_wrap_interact(id_tokenizer, text):
|
|||
|
||||
|
||||
@pytest.mark.parametrize(
|
||||
"text,length", [("kerana", 1), ("Mahathir-Anwar", 3), ("Tun Dr. Ismail-Abdul Rahman", 4)]
|
||||
"text,length", [("kerana", 1), ("Mahathir-Anwar", 3), ("Tun Dr. Ismail-Abdul Rahman", 6)]
|
||||
)
|
||||
def test_my_tokenizer_splits_hyphens(ms_tokenizer, text, length):
|
||||
tokens = ms_tokenizer(text)
|
||||
|
|
Loading…
Reference in New Issue
Block a user