From 8df9e52829485eb4b3ee4571380d3fed143fc76f Mon Sep 17 00:00:00 2001 From: Thomas Opsomer Date: Tue, 27 Feb 2018 19:50:01 +0100 Subject: [PATCH] lemma property to return hash instead of unicode --- spacy/tokens/token.pyx | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/spacy/tokens/token.pyx b/spacy/tokens/token.pyx index 9e4b878cf..cdd07ebc0 100644 --- a/spacy/tokens/token.pyx +++ b/spacy/tokens/token.pyx @@ -269,8 +269,8 @@ cdef class Token: """ def __get__(self): if self.c.lemma == 0: - lemma = self.vocab.morphology.lemmatizer.lookup(self.orth_) - return lemma + lemma_ = self.vocab.morphology.lemmatizer.lookup(self.orth_) + return self.vocab.strings[lemma_] else: return self.c.lemma