mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-10 19:57:17 +03:00
30 lines
634 B
Cython
30 lines
634 B
Cython
from libc.stdint cimport int64_t
|
|
|
|
from cymem.cymem cimport Pool
|
|
from preshed.maps cimport PreshMap
|
|
from murmurhash.mrmr cimport hash64
|
|
|
|
from .typedefs cimport attr_t, hash_t
|
|
|
|
|
|
cpdef hash_t hash_string(unicode string) except 0
|
|
|
|
|
|
ctypedef union Utf8Str:
|
|
unsigned char[8] s
|
|
unsigned char* p
|
|
|
|
|
|
cdef class StringStore:
|
|
cdef Pool mem
|
|
cdef Utf8Str* c
|
|
cdef int64_t size
|
|
cdef bint is_frozen
|
|
|
|
cdef public PreshMap _map
|
|
cdef public PreshMap _oov
|
|
cdef int64_t _resize_at
|
|
|
|
cdef const Utf8Str* intern_unicode(self, unicode py_string)
|
|
cdef const Utf8Str* _intern_utf8(self, char* utf8_string, int length)
|