mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
52ee1f9bf9
attrs
35 lines
783 B
Python
35 lines
783 B
Python
# coding: utf8
from __future__ import unicode_literals


# Base table: lowercase surface form -> normalized form. Abbreviations are
# listed once, with their trailing period; the title-cased and period-less
# variants are derived in the loop that fills NORM_EXCEPTIONS.
_exc = {
    # Slang
    "прив": "привет",

    # Weekday abbreviations
    "пн.": "понедельник",
    "вт.": "вторник",
    "ср.": "среда",
    "чт.": "четверг",
    "пт.": "пятница",
    "сб.": "суббота",
    "вс.": "воскресенье",

    # Month abbreviations
    "янв.": "январь",
    "фев.": "февраль",
    "мар.": "март",
    "апр.": "апрель",
}


# Lookup table built from _exc: each base key, its title-cased form and, for
# keys ending in a period, both of those forms with the period removed.
NORM_EXCEPTIONS = {}

for string, norm in _exc.items():
    NORM_EXCEPTIONS[string] = norm
    NORM_EXCEPTIONS[string.title()] = norm
    if string.endswith("."):
        # Also register the abbreviation written without its final period.
        NORM_EXCEPTIONS[string[:-1]] = norm
        NORM_EXCEPTIONS[string.title()[:-1]] = norm