spaCy/spacy/__init__.py

38 lines
1.2 KiB
Python
Raw Normal View History

# coding: utf8
from __future__ import unicode_literals
from . import util
2017-05-08 00:25:29 +03:00
from .util import prints
from .deprecated import resolve_model_name
2017-05-03 12:01:42 +03:00
import importlib
2017-03-28 15:10:20 +03:00
from .cli.info import info
from .glossary import explain
2017-03-18 21:30:03 +03:00
2017-05-03 12:01:42 +03:00
# Two-letter language codes listed by this module.
_languages_name = {
    "en", "de", "es", "pt", "fr",
    "it", "hu", "zh", "nl", "sv",
    "fi", "bn", "he", "nb", "ja",
}
2017-02-01 01:27:29 +03:00
2016-03-25 20:54:45 +03:00
2016-10-18 20:23:31 +03:00
def load(name, **overrides):
    """Instantiate the language class for a model name or language ID.

    name: Passed to `resolve_model_name` to find the model directory name,
        and used as the language ID when the package meta does not provide
        a 'lang' entry.
    **overrides: Keyword arguments forwarded to the language class. If
        'path' is given (and is not None/False/True) it is used as the
        model location instead of the data directory lookup. The 'meta'
        and 'path' entries are always overwritten before forwarding.
    RETURNS: The result of calling the `EXPORT` attribute of the
        `spacy.<lang>` module with the final overrides.
    """
    if overrides.get('path') in (None, False, True):
        # No usable explicit path: look the model up in the data directory.
        data_path = util.get_data_path()
        model_name = resolve_model_name(name)
        model_path = data_path / model_name
        if not model_path.exists():
            # Nothing at the resolved location: hand path=None to the
            # language class and warn that only the tokenizer is loaded.
            lang_name = util.get_lang_class(name).lang
            model_path = None
            prints("Only loading the '%s' tokenizer." % lang_name,
                   title="Warning: no model found for '%s'" % name)
    else:
        # Explicit path: the meta lookup below receives the path's parent
        # directory together with an empty model name.
        # NOTE(review): confirm against util.parse_package_meta that this
        # combination locates the intended meta file.
        model_path = util.ensure_path(overrides['path'])
        data_path = model_path.parent
        model_name = ''
    meta = util.parse_package_meta(data_path, model_name, require=False)
    # Prefer the language declared in the package meta; otherwise treat
    # `name` itself as the language ID.
    lang = meta['lang'] if meta and 'lang' in meta else name
    module = importlib.import_module("."+lang, "spacy")
    cls = module.EXPORT
    overrides['meta'] = meta
    overrides['path'] = model_path
    return cls(**overrides)