mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 01:46:28 +03:00
Improve entry points and allow custom language classes via entry points (#3080)
* Remove check for overwritten factory This needs to be handled differently – on first initialization, a new factory will be added and any subsequent initializations will trigger this warning, even if it's a new entry point that doesn't overwrite a built-in. * Add helper to only load specific entry point Useful for loading languages via entry points, so that they can be lazy-loaded. Otherwise, all entry point languages would have to be loaded upfront. * Check entry points for custom languages
This commit is contained in:
parent
ca244f5f84
commit
bb9ad37e05
|
@ -28,7 +28,7 @@ from .lang.punctuation import TOKENIZER_INFIXES
|
||||||
from .lang.tokenizer_exceptions import TOKEN_MATCH
|
from .lang.tokenizer_exceptions import TOKEN_MATCH
|
||||||
from .lang.tag_map import TAG_MAP
|
from .lang.tag_map import TAG_MAP
|
||||||
from .lang.lex_attrs import LEX_ATTRS, is_stop
|
from .lang.lex_attrs import LEX_ATTRS, is_stop
|
||||||
from .errors import Errors, Warnings, user_warning
|
from .errors import Errors
|
||||||
from . import util
|
from . import util
|
||||||
from . import about
|
from . import about
|
||||||
|
|
||||||
|
@ -146,9 +146,6 @@ class Language(object):
|
||||||
RETURNS (Language): The newly constructed object.
|
RETURNS (Language): The newly constructed object.
|
||||||
"""
|
"""
|
||||||
user_factories = util.get_entry_points("spacy_factories")
|
user_factories = util.get_entry_points("spacy_factories")
|
||||||
for factory in user_factories.keys():
|
|
||||||
if factory in self.factories:
|
|
||||||
user_warning(Warnings.W009.format(name=factory))
|
|
||||||
self.factories.update(user_factories)
|
self.factories.update(user_factories)
|
||||||
self._meta = dict(meta)
|
self._meta = dict(meta)
|
||||||
self._path = None
|
self._path = None
|
||||||
|
|
|
@ -43,6 +43,11 @@ def get_lang_class(lang):
|
||||||
RETURNS (Language): Language class.
|
RETURNS (Language): Language class.
|
||||||
"""
|
"""
|
||||||
global LANGUAGES
|
global LANGUAGES
|
||||||
|
# Check if an entry point is exposed for the language code
|
||||||
|
entry_point = get_entry_point("spacy_languages", lang)
|
||||||
|
if entry_point is not None:
|
||||||
|
LANGUAGES[lang] = entry_point
|
||||||
|
return entry_point
|
||||||
if lang not in LANGUAGES:
|
if lang not in LANGUAGES:
|
||||||
try:
|
try:
|
||||||
module = importlib.import_module(".lang.%s" % lang, "spacy")
|
module = importlib.import_module(".lang.%s" % lang, "spacy")
|
||||||
|
@ -230,6 +235,19 @@ def get_entry_points(key):
|
||||||
return result
|
return result
|
||||||
|
|
||||||
|
|
||||||
|
def get_entry_point(key, value):
|
||||||
|
"""Check if registered entry point is available for a given name and
|
||||||
|
load it. Otherwise, return None.
|
||||||
|
|
||||||
|
key (unicode): Entry point name.
|
||||||
|
value (unicode): Name of entry point to load.
|
||||||
|
RETURNS: The loaded entry point or None.
|
||||||
|
"""
|
||||||
|
for entry_point in pkg_resources.iter_entry_points(key):
|
||||||
|
if entry_point.name == value:
|
||||||
|
return entry_point.load()
|
||||||
|
|
||||||
|
|
||||||
def is_in_jupyter():
|
def is_in_jupyter():
|
||||||
"""Check if user is running spaCy from a Jupyter notebook by detecting the
|
"""Check if user is running spaCy from a Jupyter notebook by detecting the
|
||||||
IPython kernel. Mainly used for the displaCy visualizer.
|
IPython kernel. Mainly used for the displaCy visualizer.
|
||||||
|
|
Loading…
Reference in New Issue
Block a user