mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
Update punctuation.py
In Chinese, `~` and `——` are used as hyphens (dashes), and `·` is an interpunct (a separator symbol).
This commit is contained in:
parent
aa728b33ca
commit
978b24ccd4
|
@ -25,12 +25,12 @@ _QUOTES = r"""
|
||||||
|
|
||||||
_PUNCT = r"""
|
_PUNCT = r"""
|
||||||
… , : ; \! \? ¿ ¡ \( \) \[ \] \{ \} < > _ # \* &
|
… , : ; \! \? ¿ ¡ \( \) \[ \] \{ \} < > _ # \* &
|
||||||
。 ? ! , 、 ; : ~
|
。 ? ! , 、 ; : ~ ·
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
|
||||||
_HYPHENS = r"""
|
_HYPHENS = r"""
|
||||||
- – — -- ---
|
- – — -- --- —— ~
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user