mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-28 02:46:35 +03:00
49cee4af92
* Integrate Python kernel via Binder * Add live model test for languages with examples * Update docs and code examples * Adjust margin (if not bootstrapped) * Add binder version to global config * Update terminal and executable code mixins * Pass attributes through infobox and section * Hide v-cloak * Fix example * Take out model comparison for now * Add meta text for compat * Remove chart.js dependency * Tidy up and simplify JS and port big components over to Vue * Remove chartjs example * Add Twitter icon * Add purple stylesheet option * Add utility for hand cursor (special cases only) * Add transition classes * Add small option for section * Add thumb object for small round thumbnail images * Allow unset code block language via "none" value (workaround to still allow unset language to default to DEFAULT_SYNTAX) * Pass through attributes * Add syntax highlighting definitions for Julia, R and Docker * Add website icon * Remove user survey from navigation * Don't hide GitHub icon on small screens * Make top navigation scrollable on small screens * Remove old resources page and references to it * Add Universe * Add helper functions for better page URL and title * Update site description * Increment versions * Update preview images * Update mentions of resources * Fix image * Fix social images * Fix problem with cover sizing and floats * Add divider and move badges into heading * Add docstrings * Reference converting section * Add section on converting word vectors * Move converting section to custom section and fix formatting * Remove old fastText example * Move extensions content to own section Keep weird ID to not break permalinks for now (we don't want to rewrite URLs if not absolutely necessary) * Use better component example and add factories section * Add note on larger model * Use better example for non-vector * Remove similarity in context section Only works via small models with tensors so has always been kind of confusing * Add note on init-model command * 
Fix lightning tour examples and make executable if possible * Add spacy train CLI section to train * Fix formatting and add video * Fix formatting * Fix textcat example description (resolves #2246) * Add dummy file to try to resolve conflict * Delete dummy file * Tidy up [ci skip] * Ensure sufficient height of loading container * Add loading animation to universe * Update Thebelab build and use better startup message * Fix asset versioning * Fix typo [ci skip] * Add note on project idea label
142 lines
4.7 KiB
JSON
142 lines
4.7 KiB
JSON
{
|
|
"sidebar": {
|
|
"Models": {
|
|
"Overview": "./"
|
|
},
|
|
|
|
"Language models": {
|
|
"English": "en",
|
|
"German": "de",
|
|
"Spanish": "es",
|
|
"Portuguese": "pt",
|
|
"French": "fr",
|
|
"Italian": "it",
|
|
"Dutch": "nl",
|
|
"Multi-Language": "xx"
|
|
}
|
|
},
|
|
|
|
"index": {
|
|
"title": "Models Overview",
|
|
"teaser": "Downloadable statistical models for spaCy to predict and assign linguistic features.",
|
|
"quickstart": true,
|
|
"menu": {
|
|
"Quickstart": "quickstart",
|
|
"Installation": "install",
|
|
"Naming Conventions": "conventions"
|
|
}
|
|
},
|
|
|
|
"comparison": {
|
|
"title": "Model Comparison",
|
|
"teaser": "Compare spaCy's statistical models and their accuracy.",
|
|
"tag": "experimental",
|
|
"compare_models": true,
|
|
"default_models": {
|
|
"model1": "en_core_web_sm",
|
|
"model2": "en_core_web_lg"
|
|
}
|
|
},
|
|
|
|
"MODELS": {
|
|
"en": ["en_core_web_sm", "en_core_web_md", "en_core_web_lg", "en_vectors_web_lg"],
|
|
"de": ["de_core_news_sm"],
|
|
"es": ["es_core_news_sm", "es_core_news_md"],
|
|
"pt": ["pt_core_news_sm"],
|
|
"fr": ["fr_core_news_sm", "fr_core_news_md"],
|
|
"it": ["it_core_news_sm"],
|
|
"nl": ["nl_core_news_sm"],
|
|
"xx": ["xx_ent_wiki_sm"]
|
|
},
|
|
|
|
"MODEL_META": {
|
|
"core": "Vocabulary, syntax, entities, vectors",
|
|
"core_sm": "Vocabulary, syntax, entities",
|
|
"dep": "Vocabulary, syntax",
|
|
"ent": "Named entities",
|
|
"vectors": "Word vectors",
|
|
"web": "written text (blogs, news, comments)",
|
|
"news": "written text (news, media)",
|
|
"wiki": "Wikipedia",
|
|
"uas": "Unlabelled dependencies",
|
|
"las": "Labelled dependencies",
|
|
"tags_acc": "Part-of-speech tags (fine grained tags, Token.tag)",
|
|
"ents_f": "Entities (F-score)",
|
|
"ents_p": "Entities (precision)",
|
|
"ents_r": "Entities (recall)",
|
|
"cpu": "words per second on CPU",
|
|
"gpu": "words per second on GPU",
|
|
"pipeline": "Processing pipeline components in order",
|
|
"sources": "Sources of training data",
|
|
"vecs": "Word vectors included in the model. Models that only support context vectors compute similarity via the tensors shared with the pipeline.",
|
|
"benchmark_parser": "Syntax accuracy",
|
|
"benchmark_ner": "NER accuracy",
|
|
"benchmark_speed": "Speed",
|
|
"compat": "Latest compatible model version for your spaCy installation"
|
|
},
|
|
|
|
"MODEL_LICENSES": {
|
|
"CC BY 4.0": "https://creativecommons.org/licenses/by/4.0/",
|
|
"CC BY-SA": "https://creativecommons.org/licenses/by-sa/3.0/",
|
|
"CC BY-SA 3.0": "https://creativecommons.org/licenses/by-sa/3.0/",
|
|
"CC BY-SA 4.0": "https://creativecommons.org/licenses/by-sa/4.0/",
|
|
"CC BY-NC": "https://creativecommons.org/licenses/by-nc/3.0/",
|
|
"CC BY-NC 3.0": "https://creativecommons.org/licenses/by-nc/3.0/",
|
|
"CC-BY-NC-SA 3.0": "https://creativecommons.org/licenses/by-nc-sa/3.0/",
|
|
"GPL": "https://www.gnu.org/licenses/gpl.html",
|
|
"LGPL": "https://www.gnu.org/licenses/lgpl.html"
|
|
},
|
|
|
|
"MODEL_BENCHMARKS": {
|
|
"parser": { "uas": "UAS", "las": "LAS", "tags_acc": "POS" },
|
|
"ner": { "ents_f": "NER F", "ents_p": "NER P", "ents_r": "NER R" }
|
|
},
|
|
|
|
"EXAMPLE_SENT_LANGS": [
|
|
"da", "de", "en", "es", "fa", "fr", "he", "hi", "hu", "id", "it", "ja",
|
|
"nb", "nl", "pl", "pt", "ru", "sv", "tr", "zh"
|
|
],
|
|
|
|
"LANGUAGES": {
|
|
"en": "English",
|
|
"de": "German",
|
|
"fr": "French",
|
|
"es": "Spanish",
|
|
"it": "Italian",
|
|
"pt": "Portuguese",
|
|
"nl": "Dutch",
|
|
"sv": "Swedish",
|
|
"fi": "Finnish",
|
|
"nb": "Norwegian Bokmål",
|
|
"da": "Danish",
|
|
"hu": "Hungarian",
|
|
"pl": "Polish",
|
|
"ru": "Russian",
|
|
"ro": "Romanian",
|
|
"hr": "Croatian",
|
|
"tr": "Turkish",
|
|
"he": "Hebrew",
|
|
"fa": "Persian",
|
|
"ga": "Irish",
|
|
"bn": "Bengali",
|
|
"hi": "Hindi",
|
|
"id": "Indonesian",
|
|
"th": "Thai",
|
|
"zh": "Chinese",
|
|
"ja": "Japanese",
|
|
"vi": "Vietnamese",
|
|
"xx": "Multi-language"
|
|
},
|
|
|
|
"EXAMPLE_SENTENCES": {
|
|
"en": "This is a sentence.",
|
|
"de": "Dies ist ein Satz.",
|
|
"fr": "C'est une phrase.",
|
|
"es": "Esto es una frase.",
|
|
"pt": "Esta é uma frase.",
|
|
"it": "Questa è una frase.",
|
|
"nl": "Dit is een zin.",
|
|
"xx": "This is a sentence about Facebook."
|
|
}
|
|
}
|