This commit is contained in:
Jim O'Regan 2017-11-29 23:03:41 +00:00
parent 3696ce6a7b
commit b32575e78c
2 changed files with 3 additions and 1 deletion

View File

@@ -2,6 +2,7 @@
from __future__ import unicode_literals
from .tokenizer_exceptions import TOKENIZER_EXCEPTIONS
from .tag_map import TAG_MAP
from .stop_words import STOP_WORDS
from ..tokenizer_exceptions import BASE_EXCEPTIONS
@@ -17,6 +18,7 @@ class PolishDefaults(Language.Defaults):
lex_attr_getters[NORM] = add_lookups(Language.Defaults.lex_attr_getters[NORM], BASE_NORMS)
tokenizer_exceptions = update_exc(BASE_EXCEPTIONS, TOKENIZER_EXCEPTIONS)
stop_words = STOP_WORDS
tag_map = TAG_MAP
class Polish(Language):

View File

@@ -1,6 +1,6 @@
# coding: utf8
from __future__ import unicode_literals
-from ...symbols import POS, ADJ, CCONJ, SCONJ, NUM, ADV, ADP, X, VERB, NOUN
+from ...symbols import POS, ADJ, ADP, ADV, AUX, CCONJ, DET, INTJ, NOUN, NUM, PART, PRON, PROPN, PUNCT, SCONJ, VERB, X
TAG_MAP = {
"adja": {POS: ADJ},