mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 12:18:04 +03:00
✨ project: pySBD - Python Sentence Boundary Disambiguation (#4455)
* ✨ project: pySBD - Python Sentence Boundary Disambiguation * 📝 Update links and description * 🐛 Fix missing comma * Update universe.json pysbd as a spacy component through entrypoints * 🚨 Fix universe.json * 📝 Update code_example
This commit is contained in:
parent
e4820fa667
commit
6316243941
|
@ -1801,6 +1801,32 @@
|
|||
"github": "microsoft"
|
||||
}
|
||||
},
|
||||
{
|
||||
"id": "python-sentence-boundary-disambiguation",
|
||||
"title": "pySBD - python Sentence Boundary Disambiguation",
|
||||
"slogan": "a rule-based sentence boundary detection that works out-of-the-box",
|
||||
"github": "nipunsadvilkar/pySBD",
|
||||
"description": "pySBD is 'real-world' sentence segmenter which extracts a reasonable sentences when the format and domain of the input text are unknown. It is a rules-based algorithm based on [The Golden Rules](https://s3.amazonaws.com/tm-town-nlp-resources/golden_rules.txt) - a set of tests to check accuracy of segmenter in regards to edge case scenarios developed by [TM-Town](https://www.tm-town.com/) dev team. pySBD is python port of ruby gem [Pragmatic Segmenter](https://github.com/diasks2/pragmatic_segmenter).",
|
||||
"pip": "pysbd",
|
||||
"category": ["scientific"],
|
||||
"tags": ["sentence segmentation"],
|
||||
"code_example": [
|
||||
"from pysbd.util import PySBDFactory",
|
||||
"",
|
||||
"nlp = spacy.blank('en')",
|
||||
"nlp.add_pipe(PySBDFactory(nlp))",
|
||||
"",
|
||||
"doc = nlp('My name is Jonas E. Smith. Please turn to p. 55.')",
|
||||
"print(list(doc.sents))",
|
||||
"# [My name is Jonas E. Smith., Please turn to p. 55.]"
|
||||
],
|
||||
"author": "Nipun Sadvilkar",
|
||||
"author_links": {
|
||||
"twitter": "nipunsadvilkar",
|
||||
"github": "nipunsadvilkar",
|
||||
"website": "https://nipunsadvilkar.github.io"
|
||||
}
|
||||
},
|
||||
{
|
||||
"id": "cookiecutter-spacy-fastapi",
|
||||
"title": "cookiecutter-spacy-fastapi",
|
||||
|
|
Loading…
Reference in New Issue
Block a user