mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-11-04 09:57:26 +03:00 
			
		
		
		
	* Start adding parse features to sense_tagger
This commit is contained in:
		
							parent
							
								
									cb628ba352
								
							
						
					
					
						commit
						b61b495024
					
				| 
						 | 
					@ -57,16 +57,31 @@ cdef enum:
 | 
				
			||||||
    N2c6
 | 
					    N2c6
 | 
				
			||||||
    N2c4
 | 
					    N2c4
 | 
				
			||||||
 
 | 
					 
 | 
				
			||||||
 | 
					    Hw
 | 
				
			||||||
 | 
					    Hp
 | 
				
			||||||
 | 
					    Hc
 | 
				
			||||||
 | 
					    Hc6
 | 
				
			||||||
 | 
					    Hc4
 | 
				
			||||||
 | 
					    
 | 
				
			||||||
    N3W
 | 
					    N3W
 | 
				
			||||||
    P3W
 | 
					    P3W
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    P1s
 | 
					    P1s
 | 
				
			||||||
    P2s
 | 
					    P2s
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					   
 | 
				
			||||||
    CONTEXT_SIZE
 | 
					    CONTEXT_SIZE
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
unigrams = (
 | 
					unigrams = (
 | 
				
			||||||
 | 
					    (Hw,),
 | 
				
			||||||
 | 
					    (Hp,),
 | 
				
			||||||
 | 
					    (Hw, Hp),
 | 
				
			||||||
 | 
					    (Hc, Hp),
 | 
				
			||||||
 | 
					    (Hc6, Hp),
 | 
				
			||||||
 | 
					    (Hc4, Hp),
 | 
				
			||||||
 | 
					    (Hc,),
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    (P2W,),
 | 
					    (P2W,),
 | 
				
			||||||
    (P2p,),
 | 
					    (P2p,),
 | 
				
			||||||
    (P2W, P2p),
 | 
					    (P2W, P2p),
 | 
				
			||||||
| 
						 | 
					@ -189,6 +204,7 @@ cdef int fill_context(atom_t* ctxt, const TokenC* token) except -1:
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    fill_token(&ctxt[N1W], token + 1)
 | 
					    fill_token(&ctxt[N1W], token + 1)
 | 
				
			||||||
    fill_token(&ctxt[N2W], token + 2)
 | 
					    fill_token(&ctxt[N2W], token + 2)
 | 
				
			||||||
 | 
					    fill_token(&ctxt[Hw], token + token.head)
 | 
				
			||||||
    ctxt[P1s] = (token - 1).sense
 | 
					    ctxt[P1s] = (token - 1).sense
 | 
				
			||||||
    ctxt[P2s] = (token - 2).sense
 | 
					    ctxt[P2s] = (token - 2).sense
 | 
				
			||||||
    ctxt[N3W] = (token + 3).lemma
 | 
					    ctxt[N3W] = (token + 3).lemma
 | 
				
			||||||
| 
						 | 
					@ -334,7 +350,7 @@ cdef class SenseTagger:
 | 
				
			||||||
                token.sense = 1
 | 
					                token.sense = 1
 | 
				
			||||||
        return cost
 | 
					        return cost
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    cdef dict _perceptron_update(self, const Feature* feats, int n_feats, int guess, int best):
 | 
					    cdef dict _make_update(self, const Feature* feats, int n_feats, int guess, int best):
 | 
				
			||||||
        guess_counts = {}
 | 
					        guess_counts = {}
 | 
				
			||||||
        gold_counts = {}
 | 
					        gold_counts = {}
 | 
				
			||||||
        if guess != best:
 | 
					        if guess != best:
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user