__init__.py
|
enable syntax iterator and lemma lookup
|
2017-07-27 10:51:15 +07:00 |
_tokenizer_exceptions_list.py
|
more exceptions
|
2017-07-27 19:46:30 +07:00 |
lemmatizer.py
|
updated lemma
|
2017-07-27 19:46:21 +07:00 |
lex_attrs.py
|
updated like_num
|
2017-07-29 17:44:46 +07:00 |
norm_exceptions.py
|
added known currencies
|
2017-07-23 22:56:48 +07:00 |
punctuation.py
|
removed -el from suffix rules
|
2017-07-26 19:28:38 +07:00 |
stop_words.py
|
added stopwords
|
2017-07-23 20:52:37 +07:00 |
syntax_iterators.py
|
wip syntax iterators
|
2017-07-27 10:51:34 +07:00 |
tokenizer_exceptions.py
|
added u-\d+ rules (sports team)
|
2017-07-30 21:23:01 +07:00 |