adding rolegal model to the spaCy universe

This commit is contained in:
snisioi 2023-09-26 07:58:55 +03:00
parent b4501db6f8
commit 516783b376

View File

@ -4469,6 +4469,34 @@
},
"category": ["pipeline", "standalone"],
"tags": ["spans", "rules", "ner"]
},
{
"id": "rolegal",
"title": "rolegal - a spaCy Package for Legal Document Processing",
"slogan": "A spaCy Package for Romanian Legal Document Processing",
"description": "This is a spaCy language model for the Romanian legal domain, trained with floret 4-gram to 5-gram embeddings and `LEGAL` entity recognition. Useful for processing noisy legal documents produced by OCR.",
"github": "senisioi/rolegal",
"image": "https://github.com/senisioi/rolegal/blob/main/img/paper.jpeg?raw=true",
"pip": "pip install ro-legal-fl",
"tags": ["legal", "floret", "ner", "romanian"],
"code_example": [
"import spacy",
"nlp = spacy.load(\"ro_legal_fl\")",
"",
"doc = nlp(\"Titlul III din LEGEA nr. 255 din 19 iulie 2013, publicată în MONITORUL OFICIAL\")",
"# legal entity identification",
"for entity in doc.ents:",
" print('entity: ', entity, '; entity type: ', entity.label_)",
"",
"# floret n-gram embeddings robust to typos",
"print(nlp('achizit1e public@').similarity(nlp('achiziții publice')))"
],
"author": "Sergiu Nisioi",
"author_links": {
"github": "senisioi",
"website": "https://nlp.unibuc.ro/people/snisioi.html"
},
"category": ["pipeline", "training", "models"]
}
],