mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-10 09:16:31 +03:00
b0228d8ea6
* chore: add cython-linter dev dependency * fix: lexeme.pyx * fix: morphology.pxd * fix: tokenizer.pxd * fix: vocab.pxd * fix: morphology.pxd (line length) * ci: add cython-lint * ci: fix cython-lint call * Fix kb/candidate.pyx. * Fix kb/kb.pyx. * Fix kb/kb_in_memory.pyx. * Fix kb. * Fix training/ partially. * Fix training/. Ignore trailing whitespaces and too long lines. * Fix ml/. * Fix matcher/. * Fix pipeline/. * Fix tokens/. * Fix build errors. Fix vocab.pyx. * Fix cython-lint install and run. * Fix lexeme.pyx, parts_of_speech.pxd, vectors.pyx. Temporarily disable cython-lint execution. * Fix attrs.pyx, lexeme.pyx, symbols.pxd, isort issues. * Make cython-lint install conditional. Fix tokenizer.pyx. * Fix remaining files. Reenable cython-lint check. * Readded parentheses. * Fix test_build_dependencies(). * Add explanatory comment to cython-lint execution. --------- Co-authored-by: Raphael Mitsch <r.mitsch@outlook.com>
96 lines
3.2 KiB
Python
96 lines
3.2 KiB
Python
import re
|
|
from pathlib import Path
|
|
|
|
|
|
def test_build_dependencies():
|
|
# Check that library requirements are pinned exactly the same across different setup files.
|
|
# TODO: correct checks for numpy rather than ignoring
|
|
libs_ignore_requirements = [
|
|
"pytest",
|
|
"pytest-timeout",
|
|
"mock",
|
|
"flake8",
|
|
"hypothesis",
|
|
"pre-commit",
|
|
"cython-lint",
|
|
"black",
|
|
"isort",
|
|
"mypy",
|
|
"types-dataclasses",
|
|
"types-mock",
|
|
"types-requests",
|
|
"types-setuptools",
|
|
]
|
|
# ignore language-specific packages that shouldn't be installed by all
|
|
libs_ignore_setup = [
|
|
"fugashi",
|
|
"natto-py",
|
|
"pythainlp",
|
|
"sudachipy",
|
|
"sudachidict_core",
|
|
"spacy-pkuseg",
|
|
"thinc-apple-ops",
|
|
]
|
|
|
|
# check requirements.txt
|
|
req_dict = {}
|
|
|
|
root_dir = Path(__file__).parent
|
|
req_file = root_dir / "requirements.txt"
|
|
with req_file.open() as f:
|
|
lines = f.readlines()
|
|
for line in lines:
|
|
line = line.strip()
|
|
if not line.startswith("#"):
|
|
lib, v = _parse_req(line)
|
|
if lib and lib not in libs_ignore_requirements:
|
|
req_dict[lib] = v
|
|
# check setup.cfg and compare to requirements.txt
|
|
# also fails when there are missing or additional libs
|
|
setup_file = root_dir / "setup.cfg"
|
|
with setup_file.open() as f:
|
|
lines = f.readlines()
|
|
|
|
setup_keys = set()
|
|
for line in lines:
|
|
line = line.strip()
|
|
if not line.startswith("#"):
|
|
lib, v = _parse_req(line)
|
|
if lib and not lib.startswith("cupy") and lib not in libs_ignore_setup:
|
|
req_v = req_dict.get(lib, None)
|
|
assert (
|
|
req_v is not None
|
|
), "{} in setup.cfg but not in requirements.txt".format(lib)
|
|
assert (lib + v) == (lib + req_v), (
|
|
"{} has different version in setup.cfg and in requirements.txt: "
|
|
"{} and {} respectively".format(lib, v, req_v)
|
|
)
|
|
setup_keys.add(lib)
|
|
assert sorted(setup_keys) == sorted(
|
|
req_dict.keys()
|
|
) # if fail: requirements.txt contains a lib not in setup.cfg
|
|
|
|
# check pyproject.toml and compare the versions of the libs to requirements.txt
|
|
# does not fail when there are missing or additional libs
|
|
toml_file = root_dir / "pyproject.toml"
|
|
with toml_file.open() as f:
|
|
lines = f.readlines()
|
|
for line in lines:
|
|
line = line.strip().strip(",").strip('"')
|
|
if not line.startswith("#"):
|
|
lib, v = _parse_req(line)
|
|
if lib and lib not in libs_ignore_requirements:
|
|
req_v = req_dict.get(lib, None)
|
|
assert (lib + v) == (lib + req_v), (
|
|
"{} has different version in pyproject.toml and in requirements.txt: "
|
|
"{} and {} respectively".format(lib, v, req_v)
|
|
)
|
|
|
|
|
|
def _parse_req(line):
|
|
lib = re.match(r"^[a-z0-9\-]*", line).group(0)
|
|
v = line.replace(lib, "").strip()
|
|
if not re.match(r"^[<>=][<>=].*", v):
|
|
return None, None
|
|
return lib, v
|