mirror of
https://github.com/explosion/spaCy.git
synced 2025-07-27 08:29:51 +03:00
adding rolegal model to the spaCy universe
This commit is contained in:
parent
b4501db6f8
commit
516783b376
|
@ -4469,6 +4469,34 @@
|
|||
},
|
||||
"category": ["pipeline", "standalone"],
|
||||
"tags": ["spans", "rules", "ner"]
|
||||
},
|
||||
{
|
||||
"id": "rolegal",
|
||||
"title": "rolegal - a Spacy Package for Legal Document Processing",
|
||||
"slogan": "A Spacy Package for Romanian Legal Document Processing",
|
||||
"description": "This is a spacy language model for Romanian legal domain trained with floret 4-gram to 5-gram embeddings and `LEGAL` entity recognition. Useful for processing OCR-resulted noisy legal documents.",
|
||||
"github": "senisioi/rolegal",
|
||||
"image": "https://github.com/senisioi/rolegal/blob/main/img/paper.jpeg?raw=true",
|
||||
"pip": "pip install ro-legal-fl",
|
||||
"tags": ["legal", "floret", "ner", "romanian"],
|
||||
"code_example": [
|
||||
"import spacy",
|
||||
"nlp = spacy.load(\"ro_legal_fl\")",
|
||||
"",
|
||||
"doc = nlp(\"Titlul III din LEGEA nr. 255 din 19 iulie 2013, publicată în MONITORUL OFICIAL\")"
|
||||
"# legal entity identification"
|
||||
"for entity in doc.ents:"
|
||||
" print('entity: ', entity, '; entity type: ', entity.label_)"
|
||||
"",
|
||||
"# floret n-gram embeddings robust to typos",
|
||||
"print(nlp('achizit1e public@').similarity(nlp('achiziții publice')))"
|
||||
],
|
||||
"author": "Sergiu Nisioi",
|
||||
"author_links": {
|
||||
"github": "senisioi",
|
||||
"website": "https://nlp.unibuc.ro/people/snisioi.html"
|
||||
},
|
||||
"category": ["pipeline", "training", "models"]
|
||||
}
|
||||
],
|
||||
|
||||
|
|
Loading…
Reference in New Issue
Block a user