mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 17:36:30 +03:00
* Remove dead code in strings.pyx
This commit is contained in:
parent
a9c3863665
commit
8bf0f65f1c
|
@ -15,39 +15,6 @@ cpdef hash_t hash_string(unicode string) except 0:
|
||||||
return hash64(chars, len(string) * sizeof(Py_UNICODE), 0)
|
return hash64(chars, len(string) * sizeof(Py_UNICODE), 0)
|
||||||
|
|
||||||
|
|
||||||
"""
|
|
||||||
cdef class SymbolMap:
|
|
||||||
def __init__(self):
|
|
||||||
self._string_to_id = {'': 0}
|
|
||||||
self._id_to_string = ['']
|
|
||||||
|
|
||||||
def __iter__(self):
|
|
||||||
for id_, string in enumerate(self._id_to_string[1:]):
|
|
||||||
yield string, id_
|
|
||||||
|
|
||||||
def __len__(self):
|
|
||||||
return len(self._id_to_string)
|
|
||||||
|
|
||||||
def __getitem__(self, object string_or_id):
|
|
||||||
cdef bytes byte_string
|
|
||||||
if isinstance(string_or_id, int) or isinstance(string_or_id, long):
|
|
||||||
if string_or_id < 1 or string_or_id >= self.size:
|
|
||||||
raise IndexError(string_or_id)
|
|
||||||
return self._int_to_string[string_or_id]
|
|
||||||
else:
|
|
||||||
string = string_or_id
|
|
||||||
if isinstance(string, unicode):
|
|
||||||
string = string.encode('utf8')
|
|
||||||
if string in self._string_to_id:
|
|
||||||
id_ = self._string_to_id[string]
|
|
||||||
else:
|
|
||||||
id_ = len(self._string_to_id)
|
|
||||||
self._string_to_id[string] = id_
|
|
||||||
self._id_to_string.append(string)
|
|
||||||
return id_
|
|
||||||
"""
|
|
||||||
|
|
||||||
|
|
||||||
cdef class StringStore:
|
cdef class StringStore:
|
||||||
'''Map strings to and from integer IDs.'''
|
'''Map strings to and from integer IDs.'''
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
|
|
Loading…
Reference in New Issue
Block a user