mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-12 10:16:27 +03:00
51 lines
1.6 KiB
Python
51 lines
1.6 KiB
Python
from typing import Union, Iterable, Dict, Any
|
|
from pathlib import Path
|
|
import warnings
|
|
import sys
|
|
|
|
warnings.filterwarnings("ignore", message="numpy.dtype size changed") # noqa
|
|
warnings.filterwarnings("ignore", message="numpy.ufunc size changed") # noqa
|
|
|
|
# These are imported as part of the API
|
|
from thinc.api import prefer_gpu, require_gpu # noqa: F401
|
|
|
|
from . import pipeline # noqa: F401
|
|
from .cli.info import info # noqa: F401
|
|
from .glossary import explain # noqa: F401
|
|
from .about import __version__ # noqa: F401
|
|
from .util import registry # noqa: F401
|
|
|
|
from .errors import Errors
|
|
from .language import Language
|
|
from . import util
|
|
|
|
# Import-time guard: refuse to load on interpreters whose largest code point
# is U+FFFF (narrow/UCS-2 builds); the message comes from Errors.E130.
if sys.maxunicode == 0xFFFF:
    raise SystemError(Errors.E130)
|
|
|
|
|
|
def load(
    name: Union[str, Path],
    disable: Iterable[str] = tuple(),
    component_cfg: Dict[str, Dict[str, Any]] = util.SimpleFrozenDict(),
) -> Language:
    """Load a spaCy model from an installed package or a local path.

    Thin public entry point: every argument is forwarded unchanged to
    util.load_model, and its result is returned as-is.

    name (Union[str, Path]): Package name or model path.
    disable (Iterable[str]): Names of pipeline components to disable.
    component_cfg (Dict[str, Dict[str, Any]]): Config overrides for pipeline
        components, keyed by component names.
    RETURNS (Language): The loaded nlp object.
    """
    # NOTE(review): the shared default for component_cfg is presumably an
    # immutable mapping (SimpleFrozenDict) -- confirm in util.
    nlp = util.load_model(name, disable=disable, component_cfg=component_cfg)
    return nlp
|
|
|
|
|
|
def blank(name: str, **overrides) -> Language:
    """Create a blank nlp object for a given language code.

    The language class is looked up with util.get_lang_class and then
    instantiated with the supplied keyword arguments.

    name (str): The language code, e.g. "en".
    **overrides: Keyword arguments passed to language subclass on init.
    RETURNS (Language): The nlp object.
    """
    # Resolve the class for this language code and instantiate it directly.
    return util.get_lang_class(name)(**overrides)
|