diff --git a/tests/tagger/test_lemmatizer.py b/tests/tagger/test_lemmatizer.py
index 8461a854e..df553c3d6 100644
--- a/tests/tagger/test_lemmatizer.py
+++ b/tests/tagger/test_lemmatizer.py
@@ -1,3 +1,4 @@
+# -*- coding: utf-8 -*-
 from __future__ import unicode_literals
 
 from spacy.lemmatizer import Lemmatizer, read_index, read_exc
@@ -34,3 +35,17 @@ def test_noun_lemmas(lemmatizer):
     assert do('planets') == set(['planet'])
     assert do('ring') == set(['ring'])
     assert do('axes') == set(['axis', 'axe', 'ax'])
+
+
+def test_smart_quotes(lemmatizer):
+    """The opening curly double quote should lemmatize to a pair of backticks."""
+    do = lemmatizer.punct
+    assert do('“') == set(['``'])
+    # NOTE(review): repeats the assertion above; possibly meant the closing quote - confirm.
+    assert do('“') == set(['``'])
+
+
+def test_unicode_dash(lemmatizer):
+    """The Unicode dash should lemmatize to a double ASCII hyphen."""
+    do = lemmatizer.punct
+    assert do('–') == set(["--"])