mirror of
https://github.com/explosion/spaCy.git
synced 2024-09-22 03:49:17 +03:00
11 lines
236 B
Python
11 lines
236 B
Python
# coding: utf8
|
|
from __future__ import unicode_literals
|
|
|
|
from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS
|
|
|
|
# Map every string in FR_BASE_EXCEPTIONS, plus the literal "etc.", to a
# one-element list holding a single {ORTH: <string>} dict.
# Presumably each entry is a tokenizer special case that keeps the string
# as one token -- confirm against the tokenizer that consumes this table.
# NOTE(review): ORTH is not imported in the visible part of this module;
# verify that it is in scope, otherwise this raises NameError on import.
_exc = {
    orth: [{ORTH: orth}]
    for orth in FR_BASE_EXCEPTIONS + ["etc."]
}

# Public table is a shallow copy, so it is a distinct dict object from _exc.
TOKENIZER_EXCEPTIONS = dict(_exc)