spaCy/spacy/_theano.pyx

from thinc.api cimport Example, ExampleC
from thinc.typedefs cimport weight_t

from ._ml cimport arg_max_if_true
from ._ml cimport arg_max_if_zero

import numpy
from os import path


cdef class TheanoModel(Model):
    """Model whose scoring and training are delegated to supplied callables.

    The instance owns an ``InputLayer`` built from ``input_spec`` and uses it
    to prepare ``eg.embeddings`` before every call to ``predict_func`` or
    ``train_func``. Scores returned by those callables are copied into the
    example's C struct (``eg.c``).
    """
    def __init__(self, n_classes, input_spec, train_func, predict_func, model_loc=None,
                 eta=0.001, mu=0.9, debug=None):
        """Store the hyper-parameters and callables and build the input layer.

        n_classes: number of scores copied out of the callables' output.
        input_spec: passed through to ``InputLayer``.
        train_func: called by ``train`` as
            ``train_func(embeddings, costs, eta, mu)``; must return four values.
        predict_func: called by ``predict`` as ``predict_func(embeddings)``;
            element 0 of its result is used as the score vector.
        model_loc: optional path. If it names an existing directory, the
            stored location becomes ``<model_loc>/model``.
        eta, mu: forwarded to ``train_func`` and ``InputLayer.update``
            (presumably learning rate and momentum -- confirm against callers).
        debug: stored as-is; not used anywhere in this class.
        """
        if model_loc is not None and path.isdir(model_loc):
            model_loc = path.join(model_loc, 'model')

        self.eta = eta
        self.mu = mu
        # Update counter handed to InputLayer.update; starts at 1 and is
        # incremented once per train() call.
        self.t = 1
        # Each call draws one value uniformly from [-0.2, 0.2).
        initializer = lambda: 0.2 * numpy.random.uniform(-1.0, 1.0)
        self.input_layer = InputLayer(input_spec, initializer)
        self.train_func = train_func
        self.predict_func = predict_func
        self.debug = debug

        self.n_classes = n_classes
        self.n_feats = len(self.input_layer)
        self.model_loc = model_loc

    def predict(self, Example eg):
        """Score ``eg`` with ``predict_func`` and record the guess on ``eg.c``.

        Writes ``eg.c.scores[0:n_classes]`` and ``eg.c.guess``.
        """
        # NOTE(review): fill() presumably populates eg.embeddings from
        # eg.atoms, using averaged weights when use_avg=True -- confirm
        # against InputLayer.
        self.input_layer.fill(eg.embeddings, eg.atoms, use_avg=True)
        theano_scores = self.predict_func(eg.embeddings)[0]
        cdef int i
        for i in range(self.n_classes):
            eg.c.scores[i] = theano_scores[i]
        eg.c.guess = arg_max_if_true(eg.c.scores, eg.c.is_valid, self.n_classes)

    def train(self, Example eg):
        """Run one ``train_func`` step on ``eg`` and record the results on ``eg.c``.

        Writes ``eg.c.scores[0:n_classes]``, ``eg.c.guess``, ``eg.c.best``,
        ``eg.c.cost`` and ``eg.c.loss``, then increments ``self.t``.
        """
        # Typed loop index, matching predict(), so the score copy below is a
        # plain C loop over the C array eg.c.scores.
        cdef int i
        self.input_layer.fill(eg.embeddings, eg.atoms, use_avg=False)
        # The third returned value is not used here.
        theano_scores, update, _, loss = self.train_func(eg.embeddings, eg.costs,
                                                         self.eta, self.mu)
        self.input_layer.update(update, eg.atoms, self.t, self.eta, self.mu)
        for i in range(self.n_classes):
            eg.c.scores[i] = theano_scores[i]
        eg.c.guess = arg_max_if_true(eg.c.scores, eg.c.is_valid, self.n_classes)
        eg.c.best = arg_max_if_zero(eg.c.scores, eg.c.costs, self.n_classes)
        # Cost of the class the model actually guessed.
        eg.c.cost = eg.c.costs[eg.c.guess]
        eg.c.loss = loss
        self.t += 1

    def end_training(self):
        """No-op: this model performs no work when training ends."""
        pass
* Use new Example class 2015-06-28 23:36:03 +03:00			`from thinc.api cimport Example, ExampleC`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00			`from thinc.typedefs cimport weight_t`

			`from ._ml cimport arg_max_if_true`
			`from ._ml cimport arg_max_if_zero`

			`import numpy`
			`from os import path`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00

			`cdef class TheanoModel(Model):`
* Merge changes, and adjust Example to use memoryview 2015-06-28 12:36:11 +03:00			`def __init__(self, n_classes, input_spec, train_func, predict_func, model_loc=None,`
* Begin reorganizing neuralnet work 2015-06-30 15:26:32 +03:00			`eta=0.001, mu=0.9, debug=None):`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00			`if model_loc is not None and path.isdir(model_loc):`
			`model_loc = path.join(model_loc, 'model')`

* Wire eta and mu parameters up for neural net 2015-06-29 08:10:33 +03:00			`self.eta = eta`
			`self.mu = mu`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00			`self.t = 1`
			`initializer = lambda: 0.2 * numpy.random.uniform(-1.0, 1.0)`
			`self.input_layer = InputLayer(input_spec, initializer)`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00			`self.train_func = train_func`
			`self.predict_func = predict_func`
* Merge changes, and adjust Example to use memoryview 2015-06-28 12:36:11 +03:00			`self.debug = debug`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00			`self.n_classes = n_classes`
			`self.n_feats = len(self.input_layer)`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00			`self.model_loc = model_loc`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00
			`def predict(self, Example eg):`
* Reenable averaging 2015-06-29 17:44:42 +03:00			`self.input_layer.fill(eg.embeddings, eg.atoms, use_avg=True)`
* Merge changes, and adjust Example to use memoryview 2015-06-28 12:36:11 +03:00			`theano_scores = self.predict_func(eg.embeddings)[0]`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00			`cdef int i`
* Work on a theano-driven model for the parser 2015-06-23 23:55:58 +03:00			`for i in range(self.n_classes):`
* Wire eta and mu parameters up for neural net 2015-06-29 08:10:33 +03:00			`eg.c.scores[i] = theano_scores[i]`
			`eg.c.guess = arg_max_if_true(eg.c.scores, eg.c.is_valid, self.n_classes)`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00
			`def train(self, Example eg):`
* Remove hard-coding of vector lengths 2015-06-27 05:18:47 +03:00			`self.input_layer.fill(eg.embeddings, eg.atoms, use_avg=False)`
* Wire eta and mu parameters up for neural net 2015-06-29 08:10:33 +03:00			`theano_scores, update, y, loss = self.train_func(eg.embeddings, eg.costs,`
			`self.eta, self.mu)`
* Merge changes, and adjust Example to use memoryview 2015-06-28 12:36:11 +03:00			`self.input_layer.update(update, eg.atoms, self.t, self.eta, self.mu)`
			`for i in range(self.n_classes):`
* Use new Example class 2015-06-28 23:36:03 +03:00			`eg.c.scores[i] = theano_scores[i]`
* Wire eta and mu parameters up for neural net 2015-06-29 08:10:33 +03:00			`eg.c.guess = arg_max_if_true(eg.c.scores, eg.c.is_valid, self.n_classes)`
			`eg.c.best = arg_max_if_zero(eg.c.scores, eg.c.costs, self.n_classes)`
			`eg.c.cost = eg.c.costs[eg.c.guess]`
			`eg.c.loss = loss`
* Prepare for new models to be plugged in by using Example class 2015-06-26 14:51:39 +03:00			`self.t += 1`
* Merge changes, and adjust Example to use memoryview 2015-06-28 12:36:11 +03:00
			`def end_training(self):`
			`pass`