From b2031710a8df2fb96e248d7bc6768470e01c9661 Mon Sep 17 00:00:00 2001 From: Jeff Adolphe Date: Sun, 27 Apr 2025 14:19:55 -0400 Subject: [PATCH] small tweaks --- spacy/lang/ht/lemmatizer.py | 5 ----- 1 file changed, 5 deletions(-) diff --git a/spacy/lang/ht/lemmatizer.py b/spacy/lang/ht/lemmatizer.py index 5782a2c46..9ac096f6d 100644 --- a/spacy/lang/ht/lemmatizer.py +++ b/spacy/lang/ht/lemmatizer.py @@ -13,7 +13,6 @@ class HaitianCreoleLemmatizer(Lemmatizer): """ def is_base_form(self, token: Token) -> bool: - # Treat tokens as base if they're uninflected (most Creole words) morph = token.morph.to_dict() upos = token.pos_.lower() @@ -41,10 +40,6 @@ class HaitianCreoleLemmatizer(Lemmatizer): # fallback rule: just return lowercased form forms.append(string) - # optionally: plug in basic rules - # e.g. 'te manje' or 'pral fè' may need rule-based stems - # You could add more logic here later. - self.cache[cache_key] = forms return forms