* Fiddle with the way strings are interned in lexeme

2025-07-02 10:53:05 +03:00 · 2014-09-15 06:34:45 +02:00 · 2014-09-15 06:34:45 +02:00 · c396581a0b
commit c396581a0b
parent 0bb547ab98
1 changed file with 2 additions and 2 deletions
--- a/spacy/lexeme.pyx
+++ b/spacy/lexeme.pyx
@@ -24,8 +24,8 @@ cdef int lexeme_free(LexemeC* lexeme) except -1:
 cdef char* intern_and_encode(unicode string, size_t* length):
-    global _strings
+    cdef bytes byte_string = string.encode('utf8')
-    cdef bytes utf8_string = intern(string.encode('utf8'))
+    cdef bytes utf8_string = intern(byte_string)
    Py_INCREF(utf8_string)
    length[0] = len(utf8_string)
    return <char*>utf8_string