mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 12:18:04 +03:00
11 lines
236 B
Python
11 lines
236 B
Python
# coding: utf8
|
|
from __future__ import unicode_literals

from ._tokenizer_exceptions_list import ID_BASE_EXCEPTIONS
from ...symbols import ORTH
|
|
|
|
# Map every exception string to a one-element list holding a single token
# dict keyed by ORTH, whose value is the exception string itself. The literal
# "etc." is appended to the base list so it gets the same entry.
# ID_BASE_EXCEPTIONS must be a list here: it is concatenated with a list.
_exc = {orth: [{ORTH: orth}] for orth in ID_BASE_EXCEPTIONS + ["etc."]}


# Public table: a shallow copy, so the exported dict is a separate object
# from the private working dict `_exc`.
TOKENIZER_EXCEPTIONS = dict(_exc)