mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	Tidy up [ci skip]
This commit is contained in:
		
							parent
							
								
									4a0a692875
								
							
						
					
					
						commit
						49f27a2a7b
					
				| 
						 | 
					@ -1,5 +1,5 @@
 | 
				
			||||||
from ..char_classes import LIST_ELLIPSES, LIST_ICONS, HYPHENS
 | 
					from ..char_classes import LIST_ELLIPSES, LIST_ICONS, HYPHENS
 | 
				
			||||||
from ..char_classes import CONCAT_QUOTES, ALPHA_LOWER, ALPHA_UPPER, ALPHA, PUNCT
 | 
					from ..char_classes import CONCAT_QUOTES, ALPHA_LOWER, ALPHA_UPPER, ALPHA
 | 
				
			||||||
 | 
					
 | 
				
			||||||
_infixes = (
 | 
					_infixes = (
 | 
				
			||||||
    LIST_ELLIPSES
 | 
					    LIST_ELLIPSES
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -151,6 +151,6 @@ for orth in ABBREVIATIONS:
 | 
				
			||||||
# Sentences ending in "i." (as in "... peka i."), "m." (as in "...än 2000 m."),
 | 
					# Sentences ending in "i." (as in "... peka i."), "m." (as in "...än 2000 m."),
 | 
				
			||||||
# should be tokenized as two separate tokens.
 | 
					# should be tokenized as two separate tokens.
 | 
				
			||||||
for orth in ["i", "m"]:
 | 
					for orth in ["i", "m"]:
 | 
				
			||||||
    _exc[orth + "."] = [{ORTH: orth, NORM: orth, NORM: orth}, {ORTH: "."}]
 | 
					    _exc[orth + "."] = [{ORTH: orth, NORM: orth}, {ORTH: "."}]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
TOKENIZER_EXCEPTIONS = update_exc(BASE_EXCEPTIONS, _exc)
 | 
					TOKENIZER_EXCEPTIONS = update_exc(BASE_EXCEPTIONS, _exc)
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user