mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 12:18:04 +03:00
29 lines
619 B
Python
29 lines
619 B
Python
|
# encoding: utf8
|
|||
|
from __future__ import unicode_literals
|
|||
|
|
|||
|
from ..symbols import *
|
|||
|
|
|||
|
|
|||
|
# Special-case table for abbreviated Russian weekday names.
#
# Every key is a two-letter abbreviation followed by a period. It maps to a
# list containing one attribute dict: ORTH repeats the key verbatim and LEMMA
# holds the full weekday name. ORTH and LEMMA are expected to be provided by
# the star import from ``..symbols``.
#
# NOTE(review): the LEMMA values are capitalised, while Russian weekday names
# are normally written in lowercase -- confirm whether this is intentional
# before relying on these lemmas downstream.
TOKENIZER_EXCEPTIONS = {
    "Пн.": [{ORTH: "Пн.", LEMMA: "Понедельник"}],  # Monday
    "Вт.": [{ORTH: "Вт.", LEMMA: "Вторник"}],  # Tuesday
    "Ср.": [{ORTH: "Ср.", LEMMA: "Среда"}],  # Wednesday
    "Чт.": [{ORTH: "Чт.", LEMMA: "Четверг"}],  # Thursday
    "Пт.": [{ORTH: "Пт.", LEMMA: "Пятница"}],  # Friday
    "Сб.": [{ORTH: "Сб.", LEMMA: "Суббота"}],  # Saturday
    "Вс.": [{ORTH: "Вс.", LEMMA: "Воскресенье"}],  # Sunday
}
|