mirror of
https://github.com/explosion/spaCy.git
synced 2025-08-05 04:40:20 +03:00
small tweaks
This commit is contained in:
parent
031a60e3cd
commit
b2031710a8
|
@ -13,7 +13,6 @@ class HaitianCreoleLemmatizer(Lemmatizer):
|
||||||
"""
|
"""
|
||||||
|
|
||||||
def is_base_form(self, token: Token) -> bool:
|
def is_base_form(self, token: Token) -> bool:
|
||||||
# Treat tokens as base if they're uninflected (most Creole words)
|
|
||||||
morph = token.morph.to_dict()
|
morph = token.morph.to_dict()
|
||||||
upos = token.pos_.lower()
|
upos = token.pos_.lower()
|
||||||
|
|
||||||
|
@ -41,10 +40,6 @@ class HaitianCreoleLemmatizer(Lemmatizer):
|
||||||
# fallback rule: just return lowercased form
|
# fallback rule: just return lowercased form
|
||||||
forms.append(string)
|
forms.append(string)
|
||||||
|
|
||||||
# optionally: plug in basic rules
|
|
||||||
# e.g. 'te manje' or 'pral fè' may need rule-based stems
|
|
||||||
# You could add more logic here later.
|
|
||||||
|
|
||||||
self.cache[cache_key] = forms
|
self.cache[cache_key] = forms
|
||||||
return forms
|
return forms
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user