mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 01:46:28 +03:00
Fix unicode regex for Python 2 (see #834)
This commit is contained in:
parent
44de3c7642
commit
aa92d4e9b5
|
@ -472,7 +472,7 @@ cdef class Vocab:
|
||||||
cdef int32_t vec_len = -1
|
cdef int32_t vec_len = -1
|
||||||
cdef double norm = 0.0
|
cdef double norm = 0.0
|
||||||
|
|
||||||
whitespace_pattern = re.compile(r'\s')
|
whitespace_pattern = re.compile(r'\s', re.UNICODE)
|
||||||
|
|
||||||
for line_num, line in enumerate(file_):
|
for line_num, line in enumerate(file_):
|
||||||
pieces = line.split()
|
pieces = line.split()
|
||||||
|
|
Loading…
Reference in New Issue
Block a user