mirror of
				https://github.com/explosion/spaCy.git
				synced 2025-10-25 05:01:02 +03:00 
			
		
		
		
	Update parser for fine tuning
This commit is contained in:
		
							parent
							
								
									5d837c3776
								
							
						
					
					
						commit
						88bf1cf87c
					
				|  | @ -222,10 +222,10 @@ def Tok2Vec(width, embed_size, preprocess=None): | |||
|                 asarray(Model.ops, dtype='uint64') | ||||
|                 >> uniqued(embed, column=5) | ||||
|                 >> LN(Maxout(width, width*4, pieces=3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> SELU(width, width*3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> SELU(width, width*3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> SELU(width, width*3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> SELU(width, width*3)), | ||||
|                 >> Residual(ExtractWindow(nW=1) >> LN(Maxout(width, width*3))) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> Maxout(width, width*3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> Maxout(width, width*3)) | ||||
|                 >> Residual(ExtractWindow(nW=1) >> Maxout(width, width*3)), | ||||
|                 pad=4) | ||||
|         ) | ||||
|         if preprocess not in (False, None): | ||||
|  |  | |||
|  | @ -44,7 +44,7 @@ from thinc.neural.util import get_array_module | |||
| from .. import util | ||||
| from ..util import get_async, get_cuda_stream | ||||
| from .._ml import zero_init, PrecomputableAffine, PrecomputableMaxouts | ||||
| from .._ml import Tok2Vec, doc2feats, rebatch | ||||
| from .._ml import Tok2Vec, doc2feats, rebatch, fine_tune | ||||
| from ..compat import json_dumps | ||||
| 
 | ||||
| from . import _parse_features | ||||
|  | @ -237,7 +237,7 @@ cdef class Parser: | |||
|         token_vector_width = util.env_opt('token_vector_width', token_vector_width) | ||||
|         hidden_width = util.env_opt('hidden_width', hidden_width) | ||||
|         parser_maxout_pieces = util.env_opt('parser_maxout_pieces', 2) | ||||
|         tensors = Tok2Vec(token_vector_width, 7500, preprocess=doc2feats()) | ||||
|         tensors = fine_tune(Tok2Vec(token_vector_width, 7500, preprocess=doc2feats())) | ||||
|         if parser_maxout_pieces == 1: | ||||
|             lower = PrecomputableAffine(hidden_width if depth >= 1 else nr_class, | ||||
|                         nF=cls.nr_feature, | ||||
|  | @ -367,7 +367,7 @@ cdef class Parser: | |||
|             tokvecses = [tokvecses] | ||||
| 
 | ||||
|         tokvecs = self.model[0].ops.flatten(tokvecses) | ||||
|         tokvecs += self.model[0].ops.flatten(self.model[0](docs)) | ||||
|         tokvecs += self.model[0].ops.flatten(self.model[0]((docs, tokvecses))) | ||||
| 
 | ||||
|         nr_state = len(docs) | ||||
|         nr_class = self.moves.n_moves | ||||
|  | @ -419,7 +419,7 @@ cdef class Parser: | |||
|         cdef int nr_class = self.moves.n_moves | ||||
|         cdef StateClass stcls, output | ||||
|         tokvecs = self.model[0].ops.flatten(tokvecses) | ||||
|         tokvecs += self.model[0].ops.flatten(self.model[0](docs)) | ||||
|         tokvecs += self.model[0].ops.flatten(self.model[0]((docs, tokvecses))) | ||||
|         cuda_stream = get_cuda_stream() | ||||
|         state2vec, vec2scores = self.get_batch_model(len(docs), tokvecs, | ||||
|                                                      cuda_stream, 0.0) | ||||
|  | @ -460,7 +460,7 @@ cdef class Parser: | |||
|         if isinstance(docs, Doc) and isinstance(golds, GoldParse): | ||||
|             docs = [docs] | ||||
|             golds = [golds] | ||||
|         my_tokvecs, bp_my_tokvecs = self.model[0].begin_update(docs, drop=0.) | ||||
|         my_tokvecs, bp_my_tokvecs = self.model[0].begin_update(docs_tokvecs, drop=0.) | ||||
|         my_tokvecs = self.model[0].ops.flatten(my_tokvecs) | ||||
|         tokvecs += my_tokvecs | ||||
| 
 | ||||
|  |  | |||
		Loading…
	
		Reference in New Issue
	
	Block a user