mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-24 17:06:29 +03:00
German lemmatizer additions (#2529)
* lemma of was -> was * added new pairs (issue #2486) * added article tests
This commit is contained in:
parent
c21efea9bb
commit
00b9a58558
File diff suppressed because it is too large
Load Diff
|
@ -7,7 +7,9 @@ import pytest
|
||||||
@pytest.mark.parametrize('string,lemma', [('Abgehängten', 'Abgehängte'),
|
@pytest.mark.parametrize('string,lemma', [('Abgehängten', 'Abgehängte'),
|
||||||
('engagierte', 'engagieren'),
|
('engagierte', 'engagieren'),
|
||||||
('schließt', 'schließen'),
|
('schließt', 'schließen'),
|
||||||
('vorgebenden', 'vorgebend')])
|
('vorgebenden', 'vorgebend'),
|
||||||
|
('die', 'der'),
|
||||||
|
('Die', 'der')])
|
||||||
def test_lemmatizer_lookup_assigns(de_tokenizer, string, lemma):
|
def test_lemmatizer_lookup_assigns(de_tokenizer, string, lemma):
|
||||||
tokens = de_tokenizer(string)
|
tokens = de_tokenizer(string)
|
||||||
assert tokens[0].lemma_ == lemma
|
assert tokens[0].lemma_ == lemma
|
||||||
|
|
Loading…
Reference in New Issue
Block a user