# Mirror of https://github.com/explosion/spaCy.git (synced 2024-11-15 22:27:12 +03:00; 46 lines, 303 B, Python)
# coding: utf8
from __future__ import unicode_literals

# Source: https://github.com/stopwords-iso/stopwords-et

# Stop-word set built from a whitespace-separated literal: ``str.split()``
# with no arguments splits on any run of whitespace, so each line below
# contributes exactly one entry. Keep one word per line so the list stays
# easy to diff against its upstream source.
STOP_WORDS = set(
    """
aga
ei
et
ja
jah
kas
kui
kõik
ma
me
mida
midagi
mind
minu
mis
mu
mul
mulle
nad
nii
oled
olen
oli
oma
on
pole
sa
seda
see
selle
siin
siis
ta
te
ära
""".split()
)