spaCy/website/models/_data.json
Ines Montani 49cee4af92
💫 Interactive code examples, spaCy Universe and various docs improvements (#2274)
* Integrate Python kernel via Binder

* Add live model test for languages with examples

* Update docs and code examples

* Adjust margin (if not bootstrapped)

* Add binder version to global config

* Update terminal and executable code mixins

* Pass attributes through infobox and section

* Hide v-cloak

* Fix example

* Take out model comparison for now

* Add meta text for compat

* Remove chart.js dependency

* Tidy up and simplify JS and port big components over to Vue

* Remove chartjs example

* Add Twitter icon

* Add purple stylesheet option

* Add utility for hand cursor (special cases only)

* Add transition classes

* Add small option for section

* Add thumb object for small round thumbnail images

* Allow unset code block language via "none" value

(workaround to still allow unset language to default to DEFAULT_SYNTAX)

* Pass through attributes

* Add syntax highlighting definitions for Julia, R and Docker

* Add website icon

* Remove user survey from navigation

* Don't hide GitHub icon on small screens

* Make top navigation scrollable on small screens

* Remove old resources page and references to it

* Add Universe

* Add helper functions for better page URL and title

* Update site description

* Increment versions

* Update preview images

* Update mentions of resources

* Fix image

* Fix social images

* Fix problem with cover sizing and floats

* Add divider and move badges into heading

* Add docstrings

* Reference converting section

* Add section on converting word vectors

* Move converting section to custom section and fix formatting

* Remove old fastText example

* Move extensions content to own section

Keep weird ID to not break permalinks for now (we don't want to rewrite URLs if not absolutely necessary)

* Use better component example and add factories section

* Add note on larger model

* Use better example for non-vector

* Remove similarity in context section

Only works via small models with tensors so has always been kind of confusing

* Add note on init-model command

* Fix lightning tour examples and make executable if possible

* Add spacy train CLI section to train

* Fix formatting and add video

* Fix formatting

* Fix textcat example description (resolves #2246)

* Add dummy file to try resolve conflict

* Delete dummy file

* Tidy up [ci skip]

* Ensure sufficient height of loading container

* Add loading animation to universe

* Update Thebelab build and use better startup message

* Fix asset versioning

* Fix typo [ci skip]

* Add note on project idea label
2018-04-29 02:06:46 +02:00

142 lines
4.7 KiB
JSON

{
"sidebar": {
"Models": {
"Overview": "./"
},
"Language models": {
"English": "en",
"German": "de",
"Spanish": "es",
"Portuguese": "pt",
"French": "fr",
"Italian": "it",
"Dutch": "nl",
"Multi-language": "xx"
}
},
"index": {
"title": "Models Overview",
"teaser": "Downloadable statistical models for spaCy to predict and assign linguistic features.",
"quickstart": true,
"menu": {
"Quickstart": "quickstart",
"Installation": "install",
"Naming Conventions": "conventions"
}
},
"comparison": {
"title": "Model Comparison",
"teaser": "Compare spaCy's statistical models and their accuracy.",
"tag": "experimental",
"compare_models": true,
"default_models": {
"model1": "en_core_web_sm",
"model2": "en_core_web_lg"
}
},
"MODELS": {
"en": ["en_core_web_sm", "en_core_web_md", "en_core_web_lg", "en_vectors_web_lg"],
"de": ["de_core_news_sm"],
"es": ["es_core_news_sm", "es_core_news_md"],
"pt": ["pt_core_news_sm"],
"fr": ["fr_core_news_sm", "fr_core_news_md"],
"it": ["it_core_news_sm"],
"nl": ["nl_core_news_sm"],
"xx": ["xx_ent_wiki_sm"]
},
"MODEL_META": {
"core": "Vocabulary, syntax, entities, vectors",
"core_sm": "Vocabulary, syntax, entities",
"dep": "Vocabulary, syntax",
"ent": "Named entities",
"vectors": "Word vectors",
"web": "written text (blogs, news, comments)",
"news": "written text (news, media)",
"wiki": "Wikipedia",
"uas": "Unlabelled dependencies",
"las": "Labelled dependencies",
"tags_acc": "Part-of-speech tags (fine-grained tags, Token.tag)",
"ents_f": "Entities (F-score)",
"ents_p": "Entities (precision)",
"ents_r": "Entities (recall)",
"cpu": "words per second on CPU",
"gpu": "words per second on GPU",
"pipeline": "Processing pipeline components in order",
"sources": "Sources of training data",
"vecs": "Word vectors included in the model. Models that only support context vectors compute similarity via the tensors shared with the pipeline.",
"benchmark_parser": "Syntax accuracy",
"benchmark_ner": "NER accuracy",
"benchmark_speed": "Speed",
"compat": "Latest compatible model version for your spaCy installation"
},
"MODEL_LICENSES": {
"CC BY 4.0": "https://creativecommons.org/licenses/by/4.0/",
"CC BY-SA": "https://creativecommons.org/licenses/by-sa/3.0/",
"CC BY-SA 3.0": "https://creativecommons.org/licenses/by-sa/3.0/",
"CC BY-SA 4.0": "https://creativecommons.org/licenses/by-sa/4.0/",
"CC BY-NC": "https://creativecommons.org/licenses/by-nc/3.0/",
"CC BY-NC 3.0": "https://creativecommons.org/licenses/by-nc/3.0/",
"CC-BY-NC-SA 3.0": "https://creativecommons.org/licenses/by-nc-sa/3.0/",
"GPL": "https://www.gnu.org/licenses/gpl.html",
"LGPL": "https://www.gnu.org/licenses/lgpl.html"
},
"MODEL_BENCHMARKS": {
"parser": { "uas": "UAS", "las": "LAS", "tags_acc": "POS" },
"ner": { "ents_f": "NER F", "ents_p": "NER P", "ents_r": "NER R" }
},
"EXAMPLE_SENT_LANGS": [
"da", "de", "en", "es", "fa", "fr", "he", "hi", "hu", "id", "it", "ja",
"nb", "nl", "pl", "pt", "ru", "sv", "tr", "zh"
],
"LANGUAGES": {
"en": "English",
"de": "German",
"fr": "French",
"es": "Spanish",
"it": "Italian",
"pt": "Portuguese",
"nl": "Dutch",
"sv": "Swedish",
"fi": "Finnish",
"nb": "Norwegian Bokmål",
"da": "Danish",
"hu": "Hungarian",
"pl": "Polish",
"ru": "Russian",
"ro": "Romanian",
"hr": "Croatian",
"tr": "Turkish",
"he": "Hebrew",
"fa": "Persian",
"ga": "Irish",
"bn": "Bengali",
"hi": "Hindi",
"id": "Indonesian",
"th": "Thai",
"zh": "Chinese",
"ja": "Japanese",
"vi": "Vietnamese",
"xx": "Multi-language"
},
"EXAMPLE_SENTENCES": {
"en": "This is a sentence.",
"de": "Dies ist ein Satz.",
"fr": "C'est une phrase.",
"es": "Esto es una frase.",
"pt": "Esta é uma frase.",
"it": "Questa è una frase.",
"nl": "Dit is een zin.",
"xx": "This is a sentence about Facebook."
}
}