mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	* Remove unicode declarations * Remove Python 3.5 and 2.7 from CI * Don't require pathlib * Replace compat helpers * Remove OrderedDict * Use f-strings * Set Cython compiler language level * Fix typo * Re-add OrderedDict for Table * Update setup.cfg * Revert CONTRIBUTING.md * Revert lookups.md * Revert top-level.md * Small adjustments and docs [ci skip]
		
			
				
	
	
		
			44 lines
		
	
	
		
			608 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			44 lines
		
	
	
		
			608 B
		
	
	
	
		
			Python
		
	
	
	
	
	
# Stop words, stored as a set for constant-time membership tests.
#
# The entries (Irish function words, pronouns and numerals) are written as a
# single whitespace-separated block and split at import time; whitespace and
# blank lines inside the literal are therefore insignificant. Words are
# grouped by initial letter, one group per line, with accented initials
# (á, é, í, ó) listed after the unaccented alphabet.
STOP_WORDS = set(
    """
a ach ag agus an aon ar arna as

ba beirt bhúr

caoga ceathair ceathrar chomh chuig chun cois céad cúig cúigear

daichead dar de deich deichniúr den dhá do don dtí dá dár dó

faoi faoin faoina faoinár fara fiche

gach gan go gur

haon hocht

i iad idir in ina ins inár is

le leis lena lenár

mar mo muid mé

na nach naoi naonúr ná ní níor nó nócha

ocht ochtar ochtó os

roimh

sa seacht seachtar seachtó seasca seisear siad sibh sinn sna sé sí

tar thar thú triúr trí trína trínár tríocha tú

um

ár

é éis

í

ó ón óna ónár
""".split()
)