mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 18:06:29 +03:00
update tokenizertokenizer
This commit is contained in:
parent
45bc78461c
commit
85438aee1b
|
@ -35,6 +35,9 @@ ABBREVIATIONS = {
|
|||
{ORTH: "সে.মি", LEMMA: "সেন্টিমিটার"},
|
||||
{ORTH: "সে.মি.", LEMMA: "সেন্টিমিটার"},
|
||||
],
|
||||
"মি.লি.": [
|
||||
{ORTH: "মি.লি.", LEMMA: "মিলিলিটার"},
|
||||
]
|
||||
}
|
||||
|
||||
TOKENIZER_EXCEPTIONS.update(ABBREVIATIONS)
|
||||
|
|
Loading…
Reference in New Issue
Block a user