From 40e71586d607626cf7b144e39c2e049916933fa7 Mon Sep 17 00:00:00 2001
From: Matthew Honnibal
Date: Sun, 18 Dec 2016 23:44:05 +0100
Subject: [PATCH] Fix Issue #683: Add 'SP' to tag_map, if it's not there already, within the Morphology class.

---
 spacy/morphology.pyx | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/spacy/morphology.pyx b/spacy/morphology.pyx
index c13ce1920..18f4f0ae1 100644
--- a/spacy/morphology.pyx
+++ b/spacy/morphology.pyx
@@ -12,7 +12,7 @@ try:
 except ImportError:
     import json
 
-from .parts_of_speech cimport ADJ, VERB, NOUN, PUNCT
+from .parts_of_speech cimport ADJ, SPACE, VERB, NOUN, PUNCT
 from .attrs cimport POS, IS_SPACE
 from .parts_of_speech import IDS as POS_IDS
 from .lexeme cimport Lexeme
@@ -48,6 +48,9 @@ cdef class Morphology:
         self.reverse_index = {}
 
         self.rich_tags = self.mem.alloc(self.n_tags, sizeof(RichTagC))
+        # Add the 'SP' tag to the map, if it's not there already. See Issue #683.
+        if 'SP' not in tag_map:
+            tag_map['SP'] = {POS: SPACE}
         for i, (tag_str, attrs) in enumerate(sorted(tag_map.items())):
             attrs = _normalize_props(attrs)
             attrs = intify_attrs(attrs, self.strings, _do_deprecated=True)