mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 17:36:30 +03:00
Add GreekLemmatizer.lookup (resolves #4272)
This commit is contained in:
parent
6279d74c65
commit
8f9f48b04c
|
@ -46,6 +46,11 @@ class GreekLemmatizer(object):
|
||||||
)
|
)
|
||||||
return lemmas
|
return lemmas
|
||||||
|
|
||||||
|
def lookup(self, string):
|
||||||
|
if string in self.lookup_table:
|
||||||
|
return self.lookup_table[string]
|
||||||
|
return string
|
||||||
|
|
||||||
|
|
||||||
def lemmatize(string, index, exceptions, rules):
|
def lemmatize(string, index, exceptions, rules):
|
||||||
string = string.lower()
|
string = string.lower()
|
||||||
|
|
12
spacy/tests/regression/test_issue4272.py
Normal file
12
spacy/tests/regression/test_issue4272.py
Normal file
|
@ -0,0 +1,12 @@
|
||||||
|
# coding: utf8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
from spacy.lang.el import Greek
|
||||||
|
|
||||||
|
|
||||||
|
def test_issue4272():
|
||||||
|
"""Test that lookup table can be accessed from Token.lemma if no POS tags
|
||||||
|
are available."""
|
||||||
|
nlp = Greek()
|
||||||
|
doc = nlp("Χθες")
|
||||||
|
assert doc[0].lemma_
|
Loading…
Reference in New Issue
Block a user