2014-12-19 22:42:01 +03:00
|
|
|
from cymem.cymem cimport Pool
|
|
|
|
from preshed.maps cimport PreshMap
|
2014-12-19 23:41:08 +03:00
|
|
|
from murmurhash.mrmr cimport hash64
|
2015-07-18 23:39:57 +03:00
|
|
|
from .typedefs cimport attr_t
|
|
|
|
|
|
|
|
from libc.stdint cimport int64_t
|
2014-12-19 22:42:01 +03:00
|
|
|
|
2015-01-12 02:26:22 +03:00
|
|
|
from .typedefs cimport hash_t
|
|
|
|
|
2016-09-30 11:14:47 +03:00
|
|
|
# Compile-time constant equal to 2**64 - 1, the largest unsigned 64-bit value.
# In this file it is used as the error-return sentinel in the `except` clause
# of StringStore.intern.
DEF UINT64_MAX = 18446744073709551615
|
|
|
|
|
2015-01-12 02:26:22 +03:00
|
|
|
# Declaration of the string-hashing function (cpdef: callable from both
# Python and Cython). Takes a unicode string and returns a hash_t.
# `except 0` means a return value of 0 is treated as "an exception was
# raised", so the implementation must never return 0 for a successful hash.
# NOTE(review): presumably implemented with murmurhash's hash64, which this
# file cimports -- confirm against the implementation file.
cpdef hash_t hash_string(unicode string) except 0
|
2014-12-19 23:41:08 +03:00
|
|
|
|
|
|
|
|
2015-07-20 13:06:10 +03:00
|
|
|
# Union that overlays an 8-byte inline buffer (`s`) with a byte pointer (`p`);
# only one of the two members is meaningful for a given value.
# NOTE(review): presumably short strings are stored inline in `s` and longer
# ones are referenced through `p` -- confirm against the implementation.
ctypedef union Utf8Str:
|
|
|
|
# Inline storage: a fixed array of 8 unsigned chars.
unsigned char[8] s
|
|
|
|
# Pointer to unsigned char data stored elsewhere.
unsigned char* p
|
|
|
|
|
|
|
|
|
2014-12-19 22:42:01 +03:00
|
|
|
# C-level declaration of the StringStore extension type: its typed attributes
# and method signatures. No method bodies appear here; the implementations
# are defined elsewhere and must match these signatures.
cdef class StringStore:
|
|
|
|
# cymem Pool held by the store.
# NOTE(review): presumably owns the memory allocated for stored strings --
# confirm against the implementation.
cdef Pool mem
|
2015-07-20 13:06:10 +03:00
|
|
|
# Raw pointer to Utf8Str data.
# NOTE(review): presumably the start of an array of stored strings whose used
# length is tracked by `size` -- confirm against the implementation.
cdef Utf8Str* c
|
2015-07-18 23:39:57 +03:00
|
|
|
# Signed 64-bit integer.
# NOTE(review): presumably the number of strings currently stored -- confirm.
cdef int64_t size
|
2014-12-19 22:42:01 +03:00
|
|
|
|
2015-11-05 14:32:19 +03:00
|
|
|
# PreshMap that is also exposed to Python code as an attribute (`cdef public`).
# NOTE(review): presumably maps string hashes to their stored entries --
# confirm against the implementation.
cdef public PreshMap _map
|
|
|
|
# Signed 64-bit integer.
# NOTE(review): presumably the `size` threshold at which the backing storage
# is grown -- confirm against the implementation.
cdef int64_t _resize_at
|
2016-09-30 11:14:47 +03:00
|
|
|
# PreshMap, visible to Cython code only (not declared `public`).
# NOTE(review): presumably holds per-Pool maps of out-of-vocabulary strings,
# given that remove_oov_map takes a Pool -- confirm against the implementation.
cdef PreshMap oov_maps
|
|
|
|
|
|
|
|
# cpdef method (callable from Python and Cython) taking a cymem Pool and
# returning a C int. `except -1` means a return value of -1 signals that an
# exception was raised.
# NOTE(review): presumably discards the out-of-vocabulary map associated with
# `mem` -- confirm against the implementation.
cpdef int remove_oov_map(self, Pool mem) except -1
|
2014-12-19 22:42:01 +03:00
|
|
|
|
2016-09-30 11:14:47 +03:00
|
|
|
# C-level method (cdef: not callable from Python) taking a unicode string and
# an optional Pool; `mem=*` marks an optional argument whose default value is
# given in the implementation. Returns a hash_t; a return value of UINT64_MAX
# signals that an exception was raised.
# NOTE(review): presumably stores the string and returns its hash/key --
# confirm against the implementation.
cdef hash_t intern(self, unicode py_string, Pool mem=*) except UINT64_MAX
|
|
|
|
# C-level method taking a pointer to unsigned char data and an int length,
# returning a const pointer to a Utf8Str. `except NULL` means a NULL return
# signals that an exception was raised.
# NOTE(review): presumably `utf8_string` is UTF-8 encoded and `length` is its
# byte count -- confirm against the implementation.
cdef const Utf8Str* _intern_utf8(self, const unsigned char* utf8_string,
|
|
|
|
int length) except NULL
|