mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 01:46:28 +03:00
181 lines
5.2 KiB
Python
181 lines
5.2 KiB
Python
# coding: utf-8
|
|
from __future__ import unicode_literals
|
|
|
|
import pytest
|
|
import os
|
|
import ctypes
|
|
import srsly
|
|
from pathlib import Path
|
|
from spacy import util
|
|
from spacy import prefer_gpu, require_gpu
|
|
from spacy.compat import symlink_to, symlink_remove, path2str, is_windows
|
|
from spacy._ml import PrecomputableAffine
|
|
from subprocess import CalledProcessError
|
|
from .util import make_tempdir
|
|
|
|
|
|
@pytest.fixture
def symlink_target():
    """Relative path of the directory that the symlink tests link to."""
    target = Path("./foo-target")
    return target
|
|
|
|
|
|
@pytest.fixture
def symlink():
    """Relative path at which the symlink tests create their link."""
    link = Path("./foo-symlink")
    return link
|
|
|
|
|
|
@pytest.fixture(scope="function")
def symlink_setup_target(request, symlink_target, symlink):
    """Create the symlink target directory and register its teardown.

    The directory is only created when it does not exist yet. Teardown is
    registered through ``request.addfinalizer`` rather than ``yield`` so the
    cleanup runs even if an assertion in the test fails, see
    https://github.com/pytest-dev/pytest/issues/2508#issuecomment-309934240
    """

    def _teardown():
        # The link only exists if the test managed to create it.
        if symlink.exists():
            symlink_remove(symlink)
        os.rmdir(path2str(symlink_target))

    target_missing = not symlink_target.exists()
    if target_missing:
        os.mkdir(path2str(symlink_target))

    request.addfinalizer(_teardown)
|
|
|
|
|
|
@pytest.fixture
def is_admin():
    """Report whether the test run has administrator privileges.

    Uses ``os.getuid()`` where it is available; when that attribute lookup
    fails, falls back to the Windows shell32 ``IsUserAnAdmin`` call.
    """
    try:
        return os.getuid() == 0
    except AttributeError:
        # os.getuid is missing on this platform: ask the Windows shell instead.
        return ctypes.windll.shell32.IsUserAnAdmin() != 0
|
|
|
|
|
|
@pytest.mark.parametrize("text", ["hello/world", "hello world"])
def test_util_ensure_path_succeeds(text):
    """Check that util.ensure_path turns a plain string into a Path."""
    ensured = util.ensure_path(text)
    is_path = isinstance(ensured, Path)
    assert is_path
|
|
|
|
|
|
@pytest.mark.parametrize("package", ["numpy"])
def test_util_is_package(package):
    """Check that util.is_package recognises a package installed via pip."""
    recognised = util.is_package(package)
    assert recognised
|
|
|
|
|
|
@pytest.mark.parametrize("package", ["thinc"])
def test_util_get_package_path(package):
    """Check that util.get_package_path returns a Path for a package name."""
    package_path = util.get_package_path(package)
    is_path = isinstance(package_path, Path)
    assert is_path
|
|
|
|
|
|
def test_PrecomputableAffine(nO=4, nI=5, nF=3, nP=2):
    """Check PrecomputableAffine shapes and the padding-gradient accumulation.

    Verifies the weight shape, that the forward output has one more row than
    the input, and that ``_backprop_padding`` adds to ``d_pad`` once per
    ``-1`` entry found in a row of ``ids`` whose gradient is non-zero.
    """
    affine = PrecomputableAffine(nO=nO, nI=nI, nF=nF, nP=nP)
    assert affine.W.shape == (nF, nO, nP, nI)

    # Forward pass over 10 input rows; the backprop callback is not needed.
    inputs = affine.ops.allocate((10, nI))
    outputs, _ = affine.begin_update(inputs)
    assert outputs.shape == (inputs.shape[0] + 1, nF, nO, nP)
    assert affine.d_pad.shape == (1, nF, nO, nP)

    grads = affine.ops.allocate((15, nO, nP))
    feat_ids = affine.ops.allocate((15, nF))
    # Single d_pad cell that every assertion below inspects.
    probe = (0, 2, 0, 0)

    # Case 1: one -1 id in row 1 -> the probed cell receives the gradient once.
    feat_ids[1, 2] = -1
    grads[1] = 1
    assert affine.d_pad[probe] == 0.0
    affine._backprop_padding(grads, feat_ids)
    assert affine.d_pad[probe] == 1.0

    # Reset all buffers before the second scenario.
    affine.d_pad.fill(0.0)
    feat_ids.fill(0.0)
    grads.fill(0.0)

    # Case 2: three -1 ids in row 1 -> the probed cell ends up at 3.0.
    for column in (2, 1, 0):
        feat_ids[1, column] = -1
    grads[1] = 1
    assert affine.d_pad[probe] == 0.0
    affine._backprop_padding(grads, feat_ids)
    assert affine.d_pad[probe] == 3.0
|
|
|
|
|
|
def test_prefer_gpu():
    """Check that prefer_gpu() is falsy when cupy cannot be imported.

    When cupy imports successfully nothing is asserted.
    """
    try:
        import cupy  # noqa: F401
    except ImportError:
        pass
    else:
        # cupy is importable: this test has nothing to check.
        return
    assert not prefer_gpu()
|
|
|
|
|
|
def test_require_gpu():
    """Check that require_gpu() raises ValueError when cupy cannot be imported.

    When cupy imports successfully nothing is asserted.
    """
    try:
        import cupy  # noqa: F401
    except ImportError:
        pass
    else:
        # cupy is importable: this test has nothing to check.
        return
    with pytest.raises(ValueError):
        require_gpu()
|
|
|
|
|
|
def test_create_symlink_windows(
    symlink_setup_target, symlink_target, symlink, is_admin
):
    """Test the creation of symlinks on Windows.

    When the tests run as admin, or on a platform other than Windows,
    creating the symlink should succeed. Otherwise a CalledProcessError
    should be raised and no link should be left behind.

    symlink_setup_target: fixture requested for its side effect of creating
        the target directory (and removing it afterwards).
    symlink_target (Path): directory the link points to.
    symlink (Path): location of the link to create.
    is_admin (bool): whether the test run has administrator privileges.
    """
    assert symlink_target.exists()

    if is_admin or not is_windows:
        try:
            symlink_to(symlink, symlink_target)
        except CalledProcessError as e:
            # pytest.fail expects a string reason; passing the exception
            # object itself makes recent pytest versions raise a TypeError
            # instead of reporting the actual failure.
            pytest.fail(str(e))
        else:
            assert symlink.exists()
    else:
        with pytest.raises(CalledProcessError):
            symlink_to(symlink, symlink_target)

        assert not symlink.exists()
|
|
|
|
|
|
def test_ascii_filenames():
    """Check that every file and directory name in the project is ASCII-only.

    The search starts two directory levels above this test file.
    See: https://twitter.com/_inesmontani/status/1177941471632211968
    """
    project_root = Path(__file__).parent.parent
    for entry in project_root.glob("**/*"):
        name = entry.name
        # Report the offending name as the assertion message.
        assert all(ord(char) < 128 for char in name), name
|
|
|
|
|
|
def test_load_model_blank_shortcut():
    """Check that a model name of the form "blank:<lang>" loads a blank
    pipeline, i.e. acts as a shortcut for spacy.blank("<lang>"), and that an
    unknown language code raises an ImportError.
    """
    blank_nlp = util.load_model("blank:en")
    assert blank_nlp.lang == "en"
    # A blank model has no pipeline components.
    assert blank_nlp.pipeline == []

    with pytest.raises(ImportError):
        util.load_model("blank:fjsfijsdof")
|
|
|
|
|
|
def test_load_model_version_compat():
    """Exercise util.get_model_meta with several spacy_version values in meta.

    Since this is more of a hack for v2, the current major.minor version is
    specified manually to keep the test simple.
    """
    nlp = util.load_model("blank:en")
    assert nlp.meta["spacy_version"].startswith(">=2.3")

    with make_tempdir() as model_dir:
        # Meta exactly as written by to_disk: read it back unchanged.
        nlp.to_disk(model_dir)
        meta_path = Path(model_dir / "meta.json")
        util.get_model_meta(model_dir)

        # An additional compatible upper pin: read it back as well.
        nlp.meta["spacy_version"] = ">=2.3.0,<2.4.0"
        srsly.write_json(meta_path, nlp.meta)
        util.get_model_meta(model_dir)

        # An incompatible older version, then an invalid version
        # specification: each must emit a UserWarning.
        for warned_spec in (">=2.2.5", ">@#$%_invalid_version"):
            nlp.meta["spacy_version"] = warned_spec
            srsly.write_json(meta_path, nlp.meta)
            with pytest.warns(UserWarning):
                util.get_model_meta(model_dir)
|