mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
update tokenizer
This commit is contained in:
parent
45bc78461c
commit
85438aee1b
|
@@ -35,6 +35,9 @@ ABBREVIATIONS = {
|
||||||
{ORTH: "সে.মি", LEMMA: "সেন্টিমিটার"},
|
{ORTH: "সে.মি", LEMMA: "সেন্টিমিটার"},
|
||||||
{ORTH: "সে.মি.", LEMMA: "সেন্টিমিটার"},
|
{ORTH: "সে.মি.", LEMMA: "সেন্টিমিটার"},
|
||||||
],
|
],
|
||||||
|
"মি.লি.": [
|
||||||
|
{ORTH: "মি.লি.", LEMMA: "মিলিলিটার"},
|
||||||
|
]
|
||||||
}
|
}
|
||||||
|
|
||||||
TOKENIZER_EXCEPTIONS.update(ABBREVIATIONS)
|
TOKENIZER_EXCEPTIONS.update(ABBREVIATIONS)
|
||||||
|
|
Loading…
Reference in New Issue
Block a user