mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	enable tokenizer exceptions
This commit is contained in:
		
							parent
							
								
									ad56c9179a
								
							
						
					
					
						commit
						7aad6718bc
					
				| 
						 | 
					@ -1,4 +1,11 @@
 | 
				
			||||||
# coding: utf8
 | 
					# coding: utf8
 | 
				
			||||||
from __future__ import unicode_literals
 | 
					from __future__ import unicode_literals
 | 
				
			||||||
 | 
					
 | 
				
			||||||
TOKENIZER_EXCEPTIONS = {}
 | 
					from ._tokenizer_exceptions_list import FR_BASE_EXCEPTIONS
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					_exc = {}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					for orth in FR_BASE_EXCEPTIONS + ["etc."]:
 | 
				
			||||||
 | 
					    _exc[orth] = [{ORTH: orth}]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					TOKENIZER_EXCEPTIONS = dict(_exc)
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user