From 41fcfd06b8465749192a16ba5a776f9b26ad3fe7 Mon Sep 17 00:00:00 2001 From: Magnus Burton Date: Fri, 17 Feb 2017 10:04:04 +0100 Subject: [PATCH] Added regular verb rules for Swedish --- spacy/sv/lemma_rules.py | 67 ++++++++++++++++++++++++++++++++++++++++- 1 file changed, 66 insertions(+), 1 deletion(-) diff --git a/spacy/sv/lemma_rules.py b/spacy/sv/lemma_rules.py index 5bdb4284e..66731f5f5 100644 --- a/spacy/sv/lemma_rules.py +++ b/spacy/sv/lemma_rules.py @@ -23,6 +23,71 @@ LEMMA_RULES = { ["larna", "el"] ], + "verb": [ + ["r", ""], + ["de", ""], + ["t", ""], + ["er", ""], + ["te", ""], + ["a", ""], + ["e", ""], + ["t", "d"], + ["tt", "d"], + ["tt", ""], + ["ev", "iv"], + ["ack", "ick"], + ["ög", "yg"], + ["it", ""], + ["uckit", "ick"], + ["ugit", "yg"], + ["it", "et"], + ["id", "ed"], + ["ip", "ep"], + ["iv", "ev"], + ["in", "en"], + ["ik", "ek"], + ["ig", "eg"], + ["ind", ""], + ["inn", "ann"], + ["nder", "nd"], + ["inner", "inn"], + ["and", "ind"], + ["ann", "inn"], + ["s", ""], + ["anns", "inn"], + ["undit", "ind"], + ["unnit", "inn"], + ["unnits", "inn"], + ["uppit", "ipp"], + ["ungit", "ing"], + ["öd", "ud"], + ["öt", "jut"], + ["öt", "ut"], + ["ög", "ug"], + ["ögg", "ugg"], + ["öng", "ung"], + ["önk", "unk"], + ["öt", "yt"], + ["utit", "yt"], + ["ös", "ys"], + ["öv", "yv"], + ["uvit", "yv"], + ["öp", "yp"], + ["upit", "yp"], + ["ök", "yk"], + ["ukit", "yk"], + ["or", "ar"], + ["öll", "all"], + ["ät", "åt"], + ["öll", "åll"], + ["or", "är"], + ["urit", "är"], + ["åt", "ät"], + ["ar", "är"], + ["alt", "ält"], + ["ultit", "ält"] + ], + "adj": [ ["are", ""], ["ast", ""], @@ -33,7 +98,7 @@ LEMMA_RULES = { ["ängre", "ång"], ["ängst", "ång"], ["örre", "or"], - ["örst", "or"], + ["örst", "or"] ], "punct": [