mirror of
https://github.com/explosion/spaCy.git
synced 2025-03-03 10:55:52 +03:00
Add "project document" and more project.yml meta fields
This commit is contained in:
parent
fdcaf86c54
commit
f10989e8c4
|
@ -23,6 +23,7 @@ from .project.run import project_run # noqa: F401
|
||||||
from .project.dvc import project_update_dvc # noqa: F401
|
from .project.dvc import project_update_dvc # noqa: F401
|
||||||
from .project.push import project_push # noqa: F401
|
from .project.push import project_push # noqa: F401
|
||||||
from .project.pull import project_pull # noqa: F401
|
from .project.pull import project_pull # noqa: F401
|
||||||
|
from .project.document import project_document # noqa: F401
|
||||||
|
|
||||||
|
|
||||||
@app.command("link", no_args_is_help=True, deprecated=True, hidden=True)
|
@app.command("link", no_args_is_help=True, deprecated=True, hidden=True)
|
||||||
|
|
107
spacy/cli/project/document.py
Normal file
107
spacy/cli/project/document.py
Normal file
|
@ -0,0 +1,107 @@
|
||||||
|
from typing import Iterable, Optional
|
||||||
|
from pathlib import Path
|
||||||
|
from wasabi import msg
|
||||||
|
|
||||||
|
from .._util import project_cli, Arg, Opt, PROJECT_FILE, load_project_config
|
||||||
|
|
||||||
|
|
||||||
|
# Base URL that every documentation link in the generated Markdown is built on.
DOCS_URL = "https://nightly.spacy.io"

# Boilerplate paragraphs inserted under the matching section heading of the
# generated document. The line breaks inside the literals are part of the
# emitted Markdown, so they are kept exactly as written.

# Shown under the heading named after the project file.
INTRO_PROJECT = f"""The `{PROJECT_FILE}` defines the data assets required by the
project, as well as the available commands and workflows. For details, see the
[spaCy projects documentation]({DOCS_URL}/usage/projects)."""

# Shown above the table of commands.
INTRO_COMMANDS = f"""The following commands are defined by the project. They
can be executed using [`spacy project run [name]`]({DOCS_URL}/api/cli#project-run).
Commands are only re-run if their inputs have changed."""

# Shown above the table of workflows.
INTRO_WORKFLOWS = f"""The following workflows are defined by the project. They
can be executed using [`spacy project run [name]`]({DOCS_URL}/api/cli#project-run)
and will run the specified commands in order. Commands are only re-run if their
inputs have changed."""

# Shown above the table of assets.
INTRO_ASSETS = f"""The following assets are defined by the project. They can
be fetched by running [`spacy project assets`]({DOCS_URL}/api/cli#project-assets)
in the project directory."""
|
||||||
|
|
||||||
|
|
||||||
|
@project_cli.command("document")
def project_document_cli(
    # fmt: off
    project_dir: Path = Arg(Path.cwd(), help="Path to cloned project. Defaults to current working directory.", exists=True, file_okay=False),
    output_file: Path = Opt("-", "--output", "-o", help="Path to output Markdown file for output. Defaults to - for standard output"),
    no_emoji: bool = Opt(False, "--no-emoji", "-NE", help="Don't use emoji")
    # fmt: on
):
    """Auto-generate a README.md for a project."""
    # NOTE(review): the docstring above is presumably surfaced as the command's
    # help text by the CLI framework behind project_cli -- confirm before
    # rewording it.
    # Thin command-line shim: all of the work happens in project_document, so
    # that function can also be called directly from Python code.
    project_document(
        project_dir=project_dir,
        output_file=output_file,
        no_emoji=no_emoji,
    )
|
||||||
|
|
||||||
|
|
||||||
|
def project_document(
    project_dir: Path, output_file: Path, *, no_emoji: bool = False
) -> None:
    """Generate a Markdown overview of a project and print or save it.

    The project config is loaded with load_project_config and rendered as a
    title, the optional description, and one table each for the commands,
    workflows and assets it defines. Sections without entries are left out.

    project_dir (Path): Directory of the project whose config is documented.
    output_file (Path): File to write the Markdown to. The value "-" prints
        the result to standard output instead.
    no_emoji (bool): Don't prefix the section headings with emoji.
    """
    is_stdout = str(output_file) == "-"
    config = load_project_config(project_dir)
    md = MarkdownRenderer(no_emoji=no_emoji)
    title = config.get("title")
    description = config.get("description")
    heading = f"spaCy Project: {title}" if title else "spaCy Project"
    md.add(md.title(1, heading, "🪐"))
    if description:
        md.add(description)
    md.add(md.title(2, PROJECT_FILE, "📋"))
    md.add(INTRO_PROJECT)
    # Commands
    cmds = config.get("commands", [])
    # "or ''" also covers a key that is present but set to None, which would
    # otherwise make the string join in md.table raise a TypeError.
    data = [(md.code(cmd["name"]), cmd.get("help") or "") for cmd in cmds]
    if data:
        md.add(md.title(3, "Commands", "⏯"))
        md.add(INTRO_COMMANDS)
        md.add(md.table(data, ["Command", "Description"]))
    # Workflows
    wfs = config.get("workflows", {}).items()
    data = [(md.code(n), " → ".join(md.code(w) for w in stp)) for n, stp in wfs]
    if data:
        md.add(md.title(3, "Workflows", "⏭"))
        md.add(INTRO_WORKFLOWS)
        md.add(md.table(data, ["Workflow", "Steps"]))
    # Assets
    assets = config.get("assets", [])
    data = []
    for a in assets:
        # An asset counts as Git if it has a "git" entry, as URL if it has a
        # "url" entry, and as local otherwise.
        source = "Git" if a.get("git") else "URL" if a.get("url") else "Local"
        # The description may be missing or None; render both as an empty cell.
        data.append((md.code(a["dest"]), source, a.get("description") or ""))
    if data:
        md.add(md.title(3, "Assets", "🗂"))
        md.add(INTRO_ASSETS)
        md.add(md.table(data, ["File", "Source", "Description"]))
    # Output result
    if is_stdout:
        print(md.text)
    else:
        # The text contains non-ASCII characters (arrows, emoji), so the
        # encoding is set explicitly instead of relying on the locale default,
        # which can't represent them on every platform.
        with output_file.open("w", encoding="utf8") as f:
            f.write(md.text)
        msg.good("Saved project documentation", output_file)
|
||||||
|
|
||||||
|
|
||||||
|
class MarkdownRenderer:
    """Simple helper for generating raw Markdown.

    Blocks of Markdown are collected with add() and joined into one document
    by the text property. The remaining methods only format and return
    strings; they don't add anything to the document themselves.
    """

    def __init__(self, no_emoji: bool = False):
        """Create an empty renderer.

        no_emoji (bool): Leave out the emoji prefix in titles.
        """
        # Blocks (str) in the order they were added.
        self.data = []
        self.no_emoji = no_emoji

    @property
    def text(self) -> str:
        """The collected blocks, separated by blank lines."""
        return "\n\n".join(self.data)

    def add(self, content: str) -> None:
        """Append a block of Markdown to the document.

        content (str): The block to add.
        """
        self.data.append(content)

    def table(self, data: Iterable[Iterable[str]], header: Iterable[str]) -> str:
        """Format rows as a Markdown table.

        data (Iterable[Iterable[str]]): The rows, each an iterable of cells.
        header (Iterable[str]): The column titles.
        RETURNS (str): The table: header row, divider row, then one line per
            data row. Cell contents are inserted as they are.
        """
        # The header is needed twice (title row and divider row), so it is
        # materialised first. Otherwise a one-shot iterator would be used up by
        # the title row and leave the divider empty.
        header = list(header)
        head = f"| {' | '.join(header)} |"
        divider = f"| {' | '.join('---' for _ in header)} |"
        body = "\n".join(f"| {' | '.join(row)} |" for row in data)
        return f"{head}\n{divider}\n{body}"

    def title(self, level: int, text: str, emoji: Optional[str] = None) -> str:
        """Format a heading.

        level (int): Heading level, i.e. the number of leading "#" characters.
        text (str): The heading text.
        emoji (Optional[str]): Emoji to put in front of the text. Ignored if
            the renderer was created with no_emoji=True.
        RETURNS (str): The heading line.
        """
        prefix = f"{emoji} " if emoji and not self.no_emoji else ""
        return f"{'#' * level} {prefix}{text}"

    def code(self, text: str) -> str:
        """Wrap text in backticks to format it as inline code.

        text (str): The text to wrap.
        RETURNS (str): The text surrounded by single backticks.
        """
        return f"`{text}`"
|
|
@ -296,6 +296,7 @@ class ProjectConfigAssetURL(BaseModel):
|
||||||
dest: StrictStr = Field(..., title="Destination of downloaded asset")
|
dest: StrictStr = Field(..., title="Destination of downloaded asset")
|
||||||
url: Optional[StrictStr] = Field(None, title="URL of asset")
|
url: Optional[StrictStr] = Field(None, title="URL of asset")
|
||||||
checksum: str = Field(None, title="MD5 hash of file", regex=r"([a-fA-F\d]{32})")
|
checksum: str = Field(None, title="MD5 hash of file", regex=r"([a-fA-F\d]{32})")
|
||||||
|
description: StrictStr = Field("", title="Description of asset")
|
||||||
# fmt: on
|
# fmt: on
|
||||||
|
|
||||||
|
|
||||||
|
@ -303,6 +304,7 @@ class ProjectConfigAssetGit(BaseModel):
|
||||||
# fmt: off
|
# fmt: off
|
||||||
git: ProjectConfigAssetGitItem = Field(..., title="Git repo information")
|
git: ProjectConfigAssetGitItem = Field(..., title="Git repo information")
|
||||||
checksum: str = Field(None, title="MD5 hash of file", regex=r"([a-fA-F\d]{32})")
|
checksum: str = Field(None, title="MD5 hash of file", regex=r"([a-fA-F\d]{32})")
|
||||||
|
description: Optional[StrictStr] = Field(None, title="Description of asset")
|
||||||
# fmt: on
|
# fmt: on
|
||||||
|
|
||||||
|
|
||||||
|
@ -328,6 +330,7 @@ class ProjectConfigSchema(BaseModel):
|
||||||
assets: List[Union[ProjectConfigAssetURL, ProjectConfigAssetGit]] = Field([], title="Data assets")
|
assets: List[Union[ProjectConfigAssetURL, ProjectConfigAssetGit]] = Field([], title="Data assets")
|
||||||
workflows: Dict[StrictStr, List[StrictStr]] = Field({}, title="Named workflows, mapped to list of project commands to run in order")
|
workflows: Dict[StrictStr, List[StrictStr]] = Field({}, title="Named workflows, mapped to list of project commands to run in order")
|
||||||
commands: List[ProjectConfigCommand] = Field([], title="Project command shortucts")
|
commands: List[ProjectConfigCommand] = Field([], title="Project command shortucts")
|
||||||
|
title: Optional[str] = Field(None, title="Project title")
|
||||||
# fmt: on
|
# fmt: on
|
||||||
|
|
||||||
class Config:
|
class Config:
|
||||||
|
|
Loading…
Reference in New Issue
Block a user