Revert "Fix apparent bug in Spanish lemmatizer. Not sure why this emerges in v4 not in v3"

This reverts commit 64b22be76e.
This commit is contained in:
Matthew Honnibal 2024-09-04 14:26:39 +02:00
parent 64b22be76e
commit 6f7590bbf1

View File

@@ -53,15 +53,12 @@ class SpanishLemmatizer(Lemmatizer):
else:
rule_pos = pos
rule = self.select_rule(rule_pos, list(features))
-if rule is None:
-lemmas = [string]
-else:
-index = self.lookups.get_table("lemma_index").get(rule_pos, [])
-lemmas = getattr(self, "lemmatize_" + rule_pos)(
-string, features, rule, index
-)
-# Remove duplicates but preserve the ordering
-lemmas = list(dict.fromkeys(lemmas))
+index = self.lookups.get_table("lemma_index").get(rule_pos, [])
+lemmas = getattr(self, "lemmatize_" + rule_pos)(
+string, features, rule, index
+)
+# Remove duplicates but preserve the ordering
+lemmas = list(dict.fromkeys(lemmas))
self.cache[cache_key] = lemmas
return lemmas
@@ -206,7 +203,6 @@ class SpanishLemmatizer(Lemmatizer):
word (str): The word to lemmatize.
features (List[str]): The morphological features as a list of Feat=Val
pairs.
-rule (str): The rule ID to use
index (List[str]): The POS-specific lookup list.
RETURNS (List[str]): The list of lemmas.