mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-27 18:36:36 +03:00
28 lines
468 B
Python
28 lines
468 B
Python
from __future__ import unicode_literals
|
|
|
|
import pytest
|
|
|
|
from spacy.orth import word_shape as ws
|
|
|
|
|
|
def test_capitalized():
|
|
assert ws('Nasa') == 'Xxxx'
|
|
|
|
def test_truncate():
|
|
assert ws('capitalized') == 'xxxx'
|
|
|
|
def test_digits():
|
|
assert ws('999999999') == 'dddd'
|
|
|
|
def test_mix():
|
|
assert ws('C3P0') == 'XdXd'
|
|
|
|
def test_punct():
|
|
assert ws(',') == ','
|
|
|
|
def test_space():
|
|
assert ws('\n') == '\n'
|
|
|
|
def test_punct_seq():
|
|
assert ws('``,-') == '``,-'
|