Try fixing unicode inconsistencies on Python 2

This commit is contained in:
Ines Montani 2019-03-09 02:37:50 +01:00
parent d957d7a697
commit ae09b6a6cf

View File

@ -423,5 +423,5 @@ _regular_exp.append(URL_PATTERN)
TOKENIZER_EXCEPTIONS = _exc
# Build one matcher out of all the collected patterns. Each pattern is wrapped
# in a non-capturing group so that a "|" inside one pattern cannot bleed into
# its neighbours once they are joined into a single alternation.
#
# re.compile() takes exactly one `flags` argument, so the flags have to be
# OR-ed together; passing re.UNICODE as a separate third positional argument
# raises TypeError. re.UNICODE is what makes character classes and
# case-insensitive matching Unicode-aware on Python 2 (on Python 3 it is
# already the default for str patterns, so adding it is harmless there).
TOKEN_MATCH = re.compile(
    "|".join("(?:{})".format(m) for m in _regular_exp),
    re.IGNORECASE | re.UNICODE,
).match