mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	enable tokenizer exceptions
This commit is contained in:
		
							parent
							
								
									ad56c9179a
								
							
						
					
					
						commit
						7aad6718bc
					
				| 
						 | 
				
			
			@ -1,4 +1,11 @@
 | 
			
		|||
# coding: utf8
 | 
			
		||||
from __future__ import unicode_literals
 | 
			
		||||
 | 
			
		||||
from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS

# NOTE(review): ORTH is used below but no import for it is visible in this
# view of the file -- confirm it is brought into scope (presumably from the
# package's symbols module), otherwise importing this module raises NameError.

# Map every exception string (the base list plus "etc.") to a one-element
# list holding a dict keyed by ORTH whose value is the string itself.
# Presumably this tells the tokenizer to keep each string as a single token;
# verify against the tokenizer's special-case handling.
_exc = {orth: [{ORTH: orth}] for orth in FR_BASE_EXCEPTIONS + ["etc."]}

# Export a copy so later changes to _exc do not leak into the public table.
TOKENIZER_EXCEPTIONS = dict(_exc)
 | 
			
		||||
		Loading…
	
		Reference in New Issue
	
	Block a user