mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-26 09:14:32 +03:00
Fix handling of errors around git [ci skip]
This commit is contained in:
parent
f8846c198d
commit
a5633b205f
|
@ -301,6 +301,7 @@ def ensure_pathy(path):
|
||||||
|
|
||||||
|
|
||||||
def git_sparse_checkout(repo: str, subpath: str, dest: Path, *, branch: str = "master"):
|
def git_sparse_checkout(repo: str, subpath: str, dest: Path, *, branch: str = "master"):
|
||||||
|
git_version = get_git_version()
|
||||||
if dest.exists():
|
if dest.exists():
|
||||||
msg.fail("Destination of checkout must not exist", exits=1)
|
msg.fail("Destination of checkout must not exist", exits=1)
|
||||||
if not dest.parent.exists():
|
if not dest.parent.exists():
|
||||||
|
@ -321,24 +322,28 @@ def git_sparse_checkout(repo: str, subpath: str, dest: Path, *, branch: str = "m
|
||||||
# *that* we can do by path.
|
# *that* we can do by path.
|
||||||
# We're using Git and sparse checkout to only clone the files we need
|
# We're using Git and sparse checkout to only clone the files we need
|
||||||
with make_tempdir() as tmp_dir:
|
with make_tempdir() as tmp_dir:
|
||||||
git_version = get_git_version()
|
|
||||||
supports_sparse = git_version >= (2, 22)
|
supports_sparse = git_version >= (2, 22)
|
||||||
# This is the "clone, but don't download anything" part.
|
# This is the "clone, but don't download anything" part.
|
||||||
cmd = f"git clone {repo} {tmp_dir} --no-checkout --depth 1 " f"-b {branch} "
|
cmd = f"git clone {repo} {tmp_dir} --no-checkout --depth 1 " f"-b {branch} "
|
||||||
if supports_sparse:
|
if supports_sparse:
|
||||||
cmd += f"--filter=blob:none" # <-- The key bit
|
cmd += f"--filter=blob:none" # <-- The key bit
|
||||||
else:
|
else:
|
||||||
msg.warn(
|
err_old = (
|
||||||
f"You're running an old version of Git (v{git_version[0]}.{git_version[1]}) "
|
f"You're running an old version of Git (v{git_version[0]}.{git_version[1]}) "
|
||||||
f"that doesn't fully support sparse checkout yet. This means that "
|
f"that doesn't fully support sparse checkout yet."
|
||||||
f"more files than necessary may be downloaded temporarily. To "
|
|
||||||
f"only download the files needed, upgrade to Git v2.22 or above."
|
|
||||||
)
|
)
|
||||||
_attempt_run_command(cmd)
|
err_unk = "You're running an unknown version of Git, so sparse checkout has been disabled."
|
||||||
|
msg.warn(
|
||||||
|
f"{err_unk if git_version == (0, 0) else err_old} "
|
||||||
|
f"This means that more files than necessary may be downloaded "
|
||||||
|
f"temporarily. To only download the files needed, make sure "
|
||||||
|
f"you're using Git v2.22 or above."
|
||||||
|
)
|
||||||
|
try_run_command(cmd)
|
||||||
# Now we need to find the missing filenames for the subpath we want.
|
# Now we need to find the missing filenames for the subpath we want.
|
||||||
# Looking for this 'rev-list' command in the git --help? Hah.
|
# Looking for this 'rev-list' command in the git --help? Hah.
|
||||||
cmd = f"git -C {tmp_dir} rev-list --objects --all {'--missing=print ' if supports_sparse else ''} -- {subpath}"
|
cmd = f"git -C {tmp_dir} rev-list --objects --all {'--missing=print ' if supports_sparse else ''} -- {subpath}"
|
||||||
ret = _attempt_run_command(cmd)
|
ret = try_run_command(cmd)
|
||||||
git_repo = _from_http_to_git(repo)
|
git_repo = _from_http_to_git(repo)
|
||||||
# Now pass those missings into another bit of git internals
|
# Now pass those missings into another bit of git internals
|
||||||
missings = " ".join([x[1:] for x in ret.stdout.split() if x.startswith("?")])
|
missings = " ".join([x[1:] for x in ret.stdout.split() if x.startswith("?")])
|
||||||
|
@ -351,27 +356,44 @@ def git_sparse_checkout(repo: str, subpath: str, dest: Path, *, branch: str = "m
|
||||||
msg.fail(err, exits=1)
|
msg.fail(err, exits=1)
|
||||||
if supports_sparse:
|
if supports_sparse:
|
||||||
cmd = f"git -C {tmp_dir} fetch-pack {git_repo} {missings}"
|
cmd = f"git -C {tmp_dir} fetch-pack {git_repo} {missings}"
|
||||||
_attempt_run_command(cmd)
|
try_run_command(cmd)
|
||||||
# And finally, we can checkout our subpath
|
# And finally, we can checkout our subpath
|
||||||
cmd = f"git -C {tmp_dir} checkout {branch} {subpath}"
|
cmd = f"git -C {tmp_dir} checkout {branch} {subpath}"
|
||||||
_attempt_run_command(cmd)
|
try_run_command(cmd)
|
||||||
# We need Path(name) to make sure we also support subdirectories
|
# We need Path(name) to make sure we also support subdirectories
|
||||||
shutil.move(str(tmp_dir / Path(subpath)), str(dest))
|
shutil.move(str(tmp_dir / Path(subpath)), str(dest))
|
||||||
|
|
||||||
|
|
||||||
def get_git_version() -> Tuple[int, int]:
|
def get_git_version(
|
||||||
ret = _attempt_run_command(["git", "--version"])
|
error: str = "Could not run 'git'. Make sure it's installed and the executable is available.",
|
||||||
# TODO: this seems kinda brittle?
|
) -> Tuple[int, int]:
|
||||||
version = ret.stdout[11:].strip().split(".")
|
"""Get the version of git and raise an error if calling 'git --version' fails.
|
||||||
|
|
||||||
|
error (str): The error message to show.
|
||||||
|
RETURNS (Tuple[int, int]): The version as a (major, minor) tuple. Returns
|
||||||
|
(0, 0) if the version couldn't be determined.
|
||||||
|
"""
|
||||||
|
ret = try_run_command(["git", "--version"], error=error)
|
||||||
|
stdout = ret.stdout.strip()
|
||||||
|
if not stdout or not stdout.startswith("git version"):
|
||||||
|
return (0, 0)
|
||||||
|
version = stdout[11:].strip().split(".")
|
||||||
return (int(version[0]), int(version[1]))
|
return (int(version[0]), int(version[1]))
|
||||||
|
|
||||||
|
|
||||||
def _attempt_run_command(cmd: Union[str, List[str]]):
|
def try_run_command(
|
||||||
|
cmd: Union[str, List[str]], error: str = "Could not run command"
|
||||||
|
) -> subprocess.CompletedProcess:
|
||||||
|
"""Try running a command and raise an error if it fails.
|
||||||
|
|
||||||
|
cmd (Union[str, List[str]]): The command to run.
|
||||||
|
error (str): The error message.
|
||||||
|
RETURNS (CompletedProcess): The completed process if the command ran.
|
||||||
|
"""
|
||||||
try:
|
try:
|
||||||
return run_command(cmd, capture=True)
|
return run_command(cmd, capture=True)
|
||||||
except subprocess.CalledProcessError as e:
|
except subprocess.CalledProcessError as e:
|
||||||
err = f"Could not run command"
|
msg.fail(error)
|
||||||
msg.fail(err)
|
|
||||||
print(cmd)
|
print(cmd)
|
||||||
sys.exit(1)
|
sys.exit(1)
|
||||||
|
|
||||||
|
|
|
@ -7,7 +7,7 @@ import requests
|
||||||
|
|
||||||
from ...util import ensure_path, working_dir
|
from ...util import ensure_path, working_dir
|
||||||
from .._util import project_cli, Arg, PROJECT_FILE, load_project_config, get_checksum
|
from .._util import project_cli, Arg, PROJECT_FILE, load_project_config, get_checksum
|
||||||
from .._util import download_file, git_sparse_checkout
|
from .._util import download_file, git_sparse_checkout, get_git_version
|
||||||
|
|
||||||
|
|
||||||
@project_cli.command("assets")
|
@project_cli.command("assets")
|
||||||
|
@ -41,6 +41,11 @@ def project_assets(project_dir: Path) -> None:
|
||||||
dest = (project_dir / asset["dest"]).resolve()
|
dest = (project_dir / asset["dest"]).resolve()
|
||||||
checksum = asset.get("checksum")
|
checksum = asset.get("checksum")
|
||||||
if "git" in asset:
|
if "git" in asset:
|
||||||
|
git_err = (
|
||||||
|
f"Cloning spaCy project templates requires Git and the 'git' command. "
|
||||||
|
f"Make sure it's installed and that the executable is available."
|
||||||
|
)
|
||||||
|
get_git_version(error=git_err)
|
||||||
if dest.exists():
|
if dest.exists():
|
||||||
# If there's already a file, check for checksum
|
# If there's already a file, check for checksum
|
||||||
if checksum and checksum == get_checksum(dest):
|
if checksum and checksum == get_checksum(dest):
|
||||||
|
|
|
@ -7,7 +7,7 @@ import re
|
||||||
from ... import about
|
from ... import about
|
||||||
from ...util import ensure_path
|
from ...util import ensure_path
|
||||||
from .._util import project_cli, Arg, Opt, COMMAND, PROJECT_FILE
|
from .._util import project_cli, Arg, Opt, COMMAND, PROJECT_FILE
|
||||||
from .._util import git_sparse_checkout
|
from .._util import git_sparse_checkout, get_git_version
|
||||||
|
|
||||||
|
|
||||||
@project_cli.command("clone")
|
@project_cli.command("clone")
|
||||||
|
@ -70,16 +70,12 @@ def check_clone(name: str, dest: Path, repo: str) -> None:
|
||||||
dest (Path): Local destination of cloned directory.
|
dest (Path): Local destination of cloned directory.
|
||||||
repo (str): URL of the repo to clone from.
|
repo (str): URL of the repo to clone from.
|
||||||
"""
|
"""
|
||||||
try:
|
git_err = (
|
||||||
subprocess.run(["git", "--version"], stdout=subprocess.DEVNULL)
|
|
||||||
except Exception:
|
|
||||||
msg.fail(
|
|
||||||
f"Cloning spaCy project templates requires Git and the 'git' command. ",
|
f"Cloning spaCy project templates requires Git and the 'git' command. ",
|
||||||
f"To clone a project without Git, copy the files from the '{name}' "
|
f"To clone a project without Git, copy the files from the '{name}' "
|
||||||
f"directory in the {repo} to {dest} manually and then run:",
|
f"directory in the {repo} to {dest} manually.",
|
||||||
f"{COMMAND} project init {dest}",
|
|
||||||
exits=1,
|
|
||||||
)
|
)
|
||||||
|
get_git_version(error=git_err)
|
||||||
if not dest:
|
if not dest:
|
||||||
msg.fail(f"Not a valid directory to clone project: {dest}", exits=1)
|
msg.fail(f"Not a valid directory to clone project: {dest}", exits=1)
|
||||||
if dest.exists():
|
if dest.exists():
|
||||||
|
|
Loading…
Reference in New Issue
Block a user