spaCy/spacy/lang/el/lemmatizer/lemma_rules.json
Ines Montani 5ca7dd0f94
💫 WIP: Basic lookup class scaffolding and JSON for all lemmati… (#4167)
* Improve load_language_data helper

* WIP: Add Lookups implementation

* Start moving lemma data over to JSON

* WIP: move data over for more languages

* Convert more languages

* Fix lemmatizer fixtures in tests

* Finish conversion

* Auto-format JSON files

* Fix test for now

* Make sure tables are stored on instance
2019-08-22 14:21:32 +02:00

139 lines
3.9 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{
"adj": [
["οί", "ός"],
["ών", "ός"],
["ού", "ός"],
["ή", "ός"],
["ής", "ός"],
["ές", "ός"],
["οι", "ος"],
["ων", "ος"],
["ου", "ος"],
["ο", "ος"],
["α", "ος"],
["ώδη", "ώδες"],
["ύτερη", "ός"],
["ύτερης", "ός"],
["ύτερων", "ός"],
["ύτερος", "ός"],
["ύτερου", "ός"]
],
"noun": [
["ιού", "ί"],
["ιά", "ί"],
["ιών", "ί"],
["ηριού", "ήρι"],
["ια", "ι"],
["ηριών", "ήρι"],
["ας", "α"],
["ες", "α"],
["ων", "α"],
["άς", "ά"],
["ές", "ά"],
["ών", "ά"],
["ής", "ή"],
["ές", "ή"],
["ών", "ή"],
["ές", "ής"],
["ών", "ής"],
["ου", "ο"],
["α", "ο"],
["ων", "ο"],
["ητήματος", "ήτημα"],
["ητήματα", "ήτημα"],
["ητημάτων", "ήτημα"],
["τος", ""],
["τα", "α"],
["ομάτων", "όμα"],
["ού", "ός"],
["οί", "ός"],
["ών", "ός"],
["ς", ""],
["ες", "α"],
["ιών", "ία"],
["α", "ας"],
["δων", ""]
],
"verb": [
["εις", "ω"],
["ει", "ω"],
["ουμε", "ω"],
["ετε", "ω"],
["ουνε", "ω"],
["ουν", "ω"],
["είς", "ώ"],
["εί", "ώ"],
["ούν", "ώ"],
["εσαι", "ομαι"],
["εται", "ομαι"],
["ανόμαστε", "άνομαι"],
["εστε", "ομαι"],
["ονται", "ομαι"],
["άς", "ώ"],
["άει", "ώ"],
["άμε", "ώ"],
["άτε", "ώ"],
["άνε", "ώ"],
["άν", "ώ"],
["άω", "ώ"],
["ώ", "άω"],
["ιζόμουν", "ίζομαι"],
["ιζόσουν", "ίζομαι"],
["ιζόταν", "ίζομαι"],
["ιζόμασταν", "ίζομαι"],
["ιζόσασταν", "ίζομαι"],
["ονταν", "ομαι"],
["όμουν", "άμαι"],
["όσουν", "άμαι"],
["όταν", "άμαι"],
["όμασταν", "άμαι"],
["όσασταν", "άμαι"],
["όντουσταν", "άμαι"],
["ούσα", "ώ"],
["ούσες", "ώ"],
["ούσε", "ώ"],
["ούσαμε", "ώ"],
["ούσατε", "ώ"],
["ούσαν", "ώ"],
["ούσανε", "ώ"],
["λαμε", "ζω"],
["λατε", "ζω"],
["ήρα", "άρω"],
["ήρες", "άρω"],
["ήρε", "άρω"],
["ήραμε", "άρω"],
["ήρατε", "άρω"],
["ήραν", "άρω"],
["ένησα", "ενώ"],
["ένησες", "ενώ"],
["ένησε", "ενώ"],
["ενήσαμε", "ενώ"],
["ενήσατε", "ενώ"],
["ένησαν", "ενώ"],
["όνεσα", "ονώ"],
["όνεσες", "ονώ"],
["όνεσε", "ονώ"],
["έσαμε", "ώ"],
["έσατε", "ώ"],
["ισα", "ομαι"],
["ισες", "ομαι"],
["ισε", "ομαι"],
["αθίσαμε", "άθομαι"],
["αθίσατε", "άθομαι"],
["ισαν", "ομαι"],
["άπα", "απώ"],
["ά", "ώ"],
["οντας", "ω"],
["ξω", "ζω"],
["ξεις", "ζω"],
["ξουμε", "ζω"],
["ξετε", "ζω"],
["ξουν", "ζω"]
],
"punct": [
["“", "\""],
["”", "\""],
["‘", "'"],
["’", "'"]
]
}