2023-06-26 12:41:03 +03:00
|
|
|
from cymem.cymem cimport Pool
|
2022-10-06 11:51:06 +03:00
|
|
|
from libc.stdint cimport int64_t, uint32_t
|
2017-11-11 03:11:27 +03:00
|
|
|
from libcpp.set cimport set
|
2023-06-26 12:41:03 +03:00
|
|
|
from libcpp.vector cimport vector
|
2014-12-19 23:41:08 +03:00
|
|
|
from murmurhash.mrmr cimport hash64
|
2023-06-26 12:41:03 +03:00
|
|
|
from preshed.maps cimport PreshMap
|
2015-07-18 23:39:57 +03:00
|
|
|
|
2016-10-09 13:24:24 +03:00
|
|
|
from .typedefs cimport attr_t, hash_t
|
2014-12-19 22:42:01 +03:00
|
|
|
|
2015-07-20 13:06:10 +03:00
|
|
|
# Utf8Str is a C union with two overlapping views of the same storage:
# an inline array of unsigned bytes (`s`) and a pointer to unsigned bytes (`p`).
# NOTE(review): presumably short UTF-8 strings are kept inline in `s` and
# longer ones are reached through `p` -- confirm against the implementation.
ctypedef union Utf8Str:
|
|
|
|
# Inline view: eight unsigned chars stored directly inside the union.
unsigned char[8] s
|
|
|
|
# Pointer view: an `unsigned char*` sharing the same storage as `s`.
unsigned char* p
|
|
|
|
|
|
|
|
|
2014-12-19 22:42:01 +03:00
|
|
|
# Declaration of the StringStore extension type: its C-level attributes and
# the signatures of its cdef methods. Only prototypes appear here; the method
# bodies are defined elsewhere and must match these signatures.
cdef class StringStore:
|
|
|
|
# cymem memory pool held by the instance.
# NOTE(review): presumably owns the buffers backing stored strings -- confirm.
cdef Pool mem
|
2022-10-06 11:51:06 +03:00
|
|
|
# C++ vector of hash_t values.
# NOTE(review): presumably the hashes of the stored strings -- confirm.
cdef vector[hash_t] _keys
|
|
|
|
# preshed hash map held by the instance.
# NOTE(review): presumably maps a string hash to its stored representation -- confirm.
cdef PreshMap _map
|
|
|
|
|
|
|
|
# Takes a Python `str` and returns a hash_t. No exception clause is declared
# on this prototype.
cdef hash_t _intern_str(self, str string)
|
|
|
|
# Takes a byte buffer and its length and returns a pointer to a Utf8Str.
# `except *` makes Cython check for a raised exception after every call.
cdef Utf8Str* _allocate_str_repr(self, const unsigned char* chars, uint32_t length) except *
|
|
|
|
# Takes a pointer to a const Utf8Str and returns a Python `str`.
cdef str _decode_str_repr(self, const Utf8Str* string)
|
2014-12-19 22:42:01 +03:00
|
|
|
|
|
|
|
|
2022-10-06 11:51:06 +03:00
|
|
|
# Module-level cpdef function (callable from both Cython and Python code).
# Accepts any Python object and returns a hash_t; `except -1` declares -1 as
# the return value that signals a raised exception.
# NOTE(review): hash_t comes from .typedefs; if it is unsigned, -1 is its
# maximum value and a real hash equal to it would be read as an error -- confirm.
cpdef hash_t hash_string(object string) except -1
|
|
|
|
# Module-level cpdef function (callable from both Cython and Python code).
# Accepts any Python object (named `string_or_hash`) and returns a hash_t;
# `except -1` declares -1 as the return value that signals a raised exception.
# NOTE(review): the parameter name suggests both strings and precomputed
# hashes are accepted -- confirm against the implementation.
cpdef hash_t get_string_id(object string_or_hash) except -1
|