mirror of
https://github.com/explosion/spaCy.git
synced 2025-05-30 02:33:07 +03:00
Update tokenizer_exceptions.py
This commit is contained in:
parent
d1f0b397b5
commit
5352fc8fc3
|
@ -10,6 +10,8 @@ _exc = {}
|
||||||
|
|
||||||
# translate / delete what is not necessary
|
# translate / delete what is not necessary
|
||||||
for exc_data in [
|
for exc_data in [
|
||||||
|
{ORTH: "’t", LEMMA: "et", NORM: "et"},
|
||||||
|
{ORTH: "’T", LEMMA: "et", NORM: "et"},
|
||||||
{ORTH: "'t", LEMMA: "et", NORM: "et"},
|
{ORTH: "'t", LEMMA: "et", NORM: "et"},
|
||||||
{ORTH: "'T", LEMMA: "et", NORM: "et"},
|
{ORTH: "'T", LEMMA: "et", NORM: "et"},
|
||||||
{ORTH: "wgl.", LEMMA: "wannechgelift", NORM: "wannechgelift"},
|
{ORTH: "wgl.", LEMMA: "wannechgelift", NORM: "wannechgelift"},
|
||||||
|
|
Loading…
Reference in New Issue
Block a user