mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 17:36:30 +03:00
Fix Issue #639: stop words in language class not used. This patch is messy, but it's better not to change too much until the language data loading can be properly refactored.
This commit is contained in:
parent
48e1dc29d4
commit
09f68bc641
|
@ -45,7 +45,11 @@ class BaseDefaults(object):
|
|||
def create_vocab(cls, nlp=None):
|
||||
lemmatizer = cls.create_lemmatizer(nlp)
|
||||
if nlp is None or nlp.path is None:
|
||||
return Vocab(lex_attr_getters=cls.lex_attr_getters, tag_map=cls.tag_map,
|
||||
lex_attr_getters = dict(cls.lex_attr_getters)
|
||||
# This is very messy, but it's the minimal working fix to Issue #639.
|
||||
# This defaults stuff needs to be refactored (again)
|
||||
lex_attr_getters[IS_STOP] = lambda string: string.lower() in cls.stop_words
|
||||
return Vocab(lex_attr_getters=lex_attr_getters, tag_map=cls.tag_map,
|
||||
lemmatizer=lemmatizer)
|
||||
else:
|
||||
return Vocab.load(nlp.path, lex_attr_getters=cls.lex_attr_getters,
|
||||
|
|
Loading…
Reference in New Issue
Block a user