1
1
mirror of https://github.com/explosion/spaCy.git synced 2025-01-15 03:56:23 +03:00
spaCy/spacy/cli/info.py

63 lines
2.2 KiB
Python
Raw Normal View History

# coding: utf8
from __future__ import unicode_literals
import plac
import platform
from pathlib import Path
2017-03-18 20:57:45 +03:00
2017-05-08 00:25:29 +03:00
from ..compat import path2str
from .. import about
from .. import util
@plac.annotations(
model=("optional: shortcut link of model", "positional", None, str),
2017-10-27 15:38:39 +03:00
markdown=("generate Markdown for GitHub issues", "flag", "md", str))
def info(cmd, model=None, markdown=False):
"""Print info about spaCy installation. If a model shortcut link is
speficied as an argument, print model information. Flag --markdown
prints details in Markdown for easy copy-pasting to GitHub issues.
"""
if model:
if util.is_package(model):
model_path = util.get_package_path(model)
else:
model_path = util.get_data_path() / model
meta_path = model_path / 'meta.json'
if not meta_path.is_file():
2017-06-01 17:46:15 +03:00
util.prints(meta_path, title="Can't find model meta.json", exits=1)
2017-06-04 21:44:15 +03:00
meta = util.read_json(meta_path)
if model_path.resolve() != model_path:
meta['link'] = path2str(model_path)
meta['source'] = path2str(model_path.resolve())
else:
meta['source'] = path2str(model_path)
print_info(meta, 'model %s' % model, markdown)
else:
2017-05-08 00:25:29 +03:00
data = {'spaCy version': about.__version__,
'Location': path2str(Path(__file__).parent.parent),
'Platform': platform.platform(),
'Python version': platform.python_version(),
'Models': list_models()}
print_info(data, 'spaCy', markdown)
def print_info(data, title, markdown):
2017-05-08 00:25:29 +03:00
title = 'Info about %s' % title
if markdown:
util.print_markdown(data, title=title)
else:
util.print_table(data, title=title)
def list_models():
2017-05-08 00:25:29 +03:00
def exclude_dir(dir_name):
# exclude common cache directories and hidden directories
exclude = ['cache', 'pycache', '__pycache__']
return dir_name in exclude or dir_name.startswith('.')
data_path = util.get_data_path()
if data_path:
models = [f.parts[-1] for f in data_path.iterdir() if f.is_dir()]
2017-05-08 00:25:29 +03:00
return ', '.join([m for m in models if not exclude_dir(m)])
return '-'