| .. |
|
af
|
|
|
|
am
|
Tidy up and auto-format
|
2021-02-13 12:55:56 +11:00 |
|
ar
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
az
|
Fix Azerbaijani init, extend lang init tests (#8656)
|
2021-07-09 15:36:35 +02:00 |
|
bg
|
Tidy up code
|
2021-06-28 12:08:15 +02:00 |
|
bn
|
Implement overwrite param for all custom lemmatizers (#6794)
|
2021-01-26 14:53:43 +11:00 |
|
ca
|
Update Catalan language data (#8308)
|
2021-06-11 10:21:22 +02:00 |
|
cs
|
|
|
|
da
|
Merge remote-tracking branch 'upstream/master' into chore/update-develop-from-master-rc3
|
2021-01-14 11:49:58 +01:00 |
|
de
|
|
|
|
el
|
Fix non-deterministic deduplication in Greek lemmatizer (#8421)
|
2021-06-17 09:11:01 +02:00 |
|
en
|
Fix/fix en ordinals (#8028)
|
2021-05-07 10:26:42 +02:00 |
|
es
|
Tidy up and auto-format
|
2021-01-30 12:52:33 +11:00 |
|
et
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
eu
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
fa
|
Implement overwrite param for all custom lemmatizers (#6794)
|
2021-01-26 14:53:43 +11:00 |
|
fi
|
Tidy up code
|
2021-06-28 12:08:15 +02:00 |
|
fr
|
Improvements to French stopwords list (#7941)
|
2021-06-02 11:50:49 +02:00 |
|
ga
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
grc
|
Remove extraneous grc test file (#8768)
|
2021-07-20 15:51:15 +02:00 |
|
gu
|
|
|
|
he
|
raise NotImplementedError when noun_chunks iterator is not implemented (#6711)
|
2021-01-17 19:56:05 +08:00 |
|
hi
|
|
|
|
hr
|
|
|
|
hu
|
|
|
|
hy
|
|
|
|
id
|
|
|
|
is
|
|
|
|
it
|
Tidy up code
|
2021-06-28 12:08:15 +02:00 |
|
ja
|
|
|
|
kn
|
|
|
|
ko
|
|
|
|
ky
|
Tidy up and auto-format
|
2021-01-30 12:52:33 +11:00 |
|
lb
|
Remove default initialize lookups
|
2020-10-01 21:54:33 +02:00 |
|
lij
|
|
|
|
lt
|
Fix escape sequence
|
2021-01-30 12:39:58 +11:00 |
|
lv
|
|
|
|
mk
|
Tidy up and auto-format
|
2021-01-30 12:52:33 +11:00 |
|
ml
|
|
|
|
mr
|
|
|
|
nb
|
Add / to nb infixes (#7991)
|
2021-05-04 11:00:10 +02:00 |
|
ne
|
|
|
|
nl
|
Adding noun_chunks to the DUTCH language model (nl) (#8529)
|
2021-07-14 14:01:02 +02:00 |
|
pl
|
Implement overwrite param for all custom lemmatizers (#6794)
|
2021-01-26 14:53:43 +11:00 |
|
pt
|
Tidy up and auto-format
|
2021-01-15 11:57:36 +11:00 |
|
ro
|
Merge remote-tracking branch 'upstream/master' into chore/update-develop-from-master-rc3
|
2021-01-14 11:49:58 +01:00 |
|
ru
|
Auto-format code with black
|
2021-07-16 08:03:36 +00:00 |
|
sa
|
Tidy up and auto-format
|
2020-09-29 21:39:28 +02:00 |
|
si
|
|
|
|
sk
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
sl
|
|
|
|
sq
|
|
|
|
sr
|
|
|
|
sv
|
Implement overwrite param for all custom lemmatizers (#6794)
|
2021-01-26 14:53:43 +11:00 |
|
ta
|
|
|
|
te
|
Simplify language data and revert detailed configs
|
2020-07-24 14:50:26 +02:00 |
|
th
|
Remove default initialize lookups
|
2020-10-01 21:54:33 +02:00 |
|
ti
|
Tidy up and auto-format
|
2021-01-15 11:57:36 +11:00 |
|
tl
|
|
|
|
tn
|
Tidy up and auto-format
|
2021-02-13 12:55:56 +11:00 |
|
tr
|
Tidy up and auto-format
|
2021-01-05 13:41:53 +11:00 |
|
tt
|
|
|
|
uk
|
Fix ru/uk lemmatizer mp with spawn (#8657)
|
2021-07-09 15:36:56 +02:00 |
|
ur
|
|
|
|
vi
|
Update Vietnamese tokenizer (#8099)
|
2021-05-17 18:16:20 +10:00 |
|
xx
|
|
|
|
yo
|
|
|
|
zh
|
|
|
|
__init__.py
|
|
|
|
char_classes.py
|
Add all symbols in Unicode Currency Symbols block (#8212)
|
2021-05-31 18:03:40 +10:00 |
|
lex_attrs.py
|
|
|
|
norm_exceptions.py
|
|
|
|
punctuation.py
|
|
|
|
tokenizer_exceptions.py
|
Tidy up with flake8: imports, comparisons, etc.
|
2021-06-28 12:08:15 +02:00 |