mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 01:48:04 +03:00 
			
		
		
		
	* Add canon_case function
This commit is contained in:
		
							parent
							
								
									8bbfadfced
								
							
						
					
					
						commit
						a779275a59
					
				| 
						 | 
				
			
			@ -41,7 +41,16 @@ def can_tag(name, thresh):
 | 
			
		|||
 | 
			
		||||
# String features
 | 
			
		||||
def canon_case(string, prob, cluster, case_stats, tag_stats):
    """Return *string* re-cased to its most common casing.

    The casing is picked by comparing three entries of ``case_stats``:
    ``'upper'``, ``'title'`` and ``'lower'``. Ties are resolved in that
    order of preference: upper wins over title and lower, and title wins
    over lower.

    Args:
        string: The text to re-case.
        prob: Unused here; kept so the signature stays the same.
        cluster: Unused here; kept so the signature stays the same.
        case_stats: Mapping with ``'upper'``, ``'title'`` and ``'lower'``
            keys holding mutually comparable values (presumably the
            proportion of occurrences seen in each casing -- TODO confirm
            against the caller).
        tag_stats: Unused here; kept so the signature stays the same.

    Returns:
        ``string.upper()``, ``string.title()`` or ``string.lower()``.

    Raises:
        KeyError: If ``case_stats`` lacks one of the three keys.
    """
    # NOTE: the previous placeholder body (`return string`) has been dropped;
    # leaving it in place would make everything below unreachable.
    upper_pc = case_stats['upper']
    title_pc = case_stats['title']
    lower_pc = case_stats['lower']

    if upper_pc >= lower_pc and upper_pc >= title_pc:
        return string.upper()
    elif title_pc >= lower_pc:
        return string.title()
    else:
        return string.lower()
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
def word_shape(string, *args):
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in New Issue
	
	Block a user