# cython: infer_types=True
# cython: profile=True
# cython: cdivision=True
from libcpp.vector cimport vector
from libc.stdint cimport uint64_t, uint32_t, int32_t
from libc.string cimport memcpy, memset
cimport libcpp.algorithm
from libc.math cimport exp

from cymem.cymem cimport Pool
from thinc.linalg cimport Vec, VecVec
from murmurhash.mrmr cimport hash64
cimport numpy as np
import numpy
np.import_array()

from thinc.neural.optimizers import Adam
from thinc.neural.ops import NumpyOps


cdef class LinearModel:
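    """A sparse linear model over hashed conjunction features.

    Weights are stored in a flat table of nr_weight buckets, each holding
    nr_class weights; feature keys are hashed into this table (see
    set_scoresC), so collisions are possible but rare for large sizes.
    """
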
    def __init__(self, int nr_class, templates, weight_t learn_rate=0.001,
                 size=2**18):
        self.extracter = ConjunctionExtracter(templates)
        self.nr_weight = size
        self.nr_class = nr_class
        self.learn_rate = learn_rate
        self.mem = Pool()
        self.W = <weight_t*>self.mem.alloc(self.nr_weight * self.nr_class,
                                           sizeof(weight_t))
        self.d_W = <weight_t*>self.mem.alloc(self.nr_weight * self.nr_class,
                                             sizeof(weight_t))
        self._indices = new vector[uint64_t]()

    def __dealloc__(self):
        del self._indices

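    # Hinge-style loss: if the best-scoring class is not a zero-cost (gold)
    # class, push its score down and push up the best-scoring gold class.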
    cdef void hinge_lossC(self, weight_t* d_scores,
            const weight_t* scores, const weight_t* costs) nogil:
        guess = 0
        # Consider class 0 as a candidate gold class too.
        best = 0 if costs[0] == 0 else -1
        for i in range(1, self.nr_class):
            if scores[i] > scores[guess]:
                guess = i
            if costs[i] == 0 and (best == -1 or scores[i] > scores[best]):
                best = i
        # Only update when the prediction differs from the best gold class.
        if best != -1 and guess != best and scores[guess] >= scores[best]:
            d_scores[guess] = 1.
            d_scores[best] = -1.

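    # Log-loss (softmax) gradient: d_i = P(i) - P_gold(i), where P is the
    # softmax over all classes and P_gold is the softmax restricted to the
    # zero-cost classes. Scores are shifted by their max before exp() for
    # numerical stability.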
    cdef void log_lossC(self, weight_t* d_scores,
            const weight_t* scores, const weight_t* costs) nogil:
        # Bail out if no class has zero cost: there is no gold target.
        for i in range(self.nr_class):
            if costs[i] <= 0:
                break
        else:
            return
        cdef double Z = 1e-10
        cdef double gZ = 1e-10
        cdef double max_ = scores[0]
        cdef double g_max = -9000  # sentinel lower than any realistic score
        for i in range(self.nr_class):
            max_ = max(max_, scores[i])
            if costs[i] <= 0:
                g_max = max(g_max, scores[i])
        for i in range(self.nr_class):
            Z += exp(scores[i] - max_)
            if costs[i] <= 0:
                gZ += exp(scores[i] - g_max)
        for i in range(self.nr_class):
            score = exp(scores[i] - max_)
            if costs[i] >= 1:
                d_scores[i] = score / Z
            else:
                g_score = exp(scores[i] - g_max)
                d_scores[i] = (score / Z) - (g_score / gZ)

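    # Regression-style loss: each class's target score is -cost; classes
    # already scoring below the best gold class are left untouched.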
    cdef void regression_lossC(self, weight_t* d_scores,
            const weight_t* scores, const weight_t* costs) nogil:
        best = -1
        for i in range(self.nr_class):
            if costs[i] <= 0:
                if best == -1:
                    best = i
                elif scores[i] > scores[best]:
                    best = i
        if best == -1:
            return
        for i in range(self.nr_class):
            if scores[i] < scores[best]:
                d_scores[i] = 0
            elif costs[i] <= 0 and scores[i] == scores[best]:
                continue
            else:
                # The target for each remaining class is -cost.
                d_scores[i] = scores[i] - -costs[i]

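    # Feature hashing: each 64-bit feature key is split into two 32-bit
    # halves, and each half selects a row of nr_class weights modulo the
    # table size. Collisions are tolerated by design.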
    cdef void set_scoresC(self, weight_t* scores,
            const FeatureC* features, int nr_feat) nogil:
        cdef uint64_t nr_weight = self.nr_weight
        cdef int nr_class = self.nr_class
        cdef vector[uint64_t] indices
        # Collect all feature indices
        cdef uint32_t[2] hashed
        cdef FeatureC feat
        for feat in features[:nr_feat]:
            if feat.value == 0:
                continue
            memcpy(hashed, &feat.key, sizeof(hashed))
            indices.push_back(hashed[0] % nr_weight)
            indices.push_back(hashed[1] % nr_weight)

        # Sort them, to improve memory access pattern
        libcpp.algorithm.sort(indices.begin(), indices.end())
        for idx in indices:
            W = &self.W[idx * nr_class]
            for clas in range(nr_class):
                scores[clas] += W[clas]

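    # Accumulate gradients into the same hashed rows used for scoring,
    # clipping each per-class update to [-10, 10].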
    cdef void set_gradientC(self, const weight_t* d_scores,
            const FeatureC* features, int nr_feat) nogil:
        cdef uint64_t nr_weight = self.nr_weight
        cdef int nr_class = self.nr_class
        cdef vector[uint64_t] indices
        # Collect all feature indices
        cdef uint32_t[2] hashed
        cdef FeatureC feat
        for feat in features[:nr_feat]:
            if feat.value == 0:
                continue
            memcpy(hashed, &feat.key, sizeof(hashed))
            indices.push_back(hashed[0] % nr_weight)
            indices.push_back(hashed[1] % nr_weight)

        # Sort them, to improve memory access pattern
        libcpp.algorithm.sort(indices.begin(), indices.end())
        for idx in indices:
            d_W = &self.d_W[idx * nr_class]
            for clas in range(nr_class):
                if d_scores[clas] < 0:
                    d_W[clas] += max(-10., d_scores[clas])
                else:
                    d_W[clas] += min(10., d_scores[clas])

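    # Wrap the raw weight and gradient buffers as NumPy views (no copy) so
    # the optimizer can update them in place. np.NPY_FLOAT must match the
    # width of weight_t.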
    def finish_update(self, optimizer):
        cdef np.npy_intp[1] shape
        shape[0] = self.nr_weight * self.nr_class
        W_arr = np.PyArray_SimpleNewFromData(1, shape, np.NPY_FLOAT, self.W)
        dW_arr = np.PyArray_SimpleNewFromData(1, shape, np.NPY_FLOAT, self.d_W)
        optimizer(W_arr, dW_arr, key=1)

    @property
    def nr_active_feat(self):
        return self.nr_weight

    @property
    def nr_feat(self):
        return self.extracter.nr_templ

    def end_training(self, *args, **kwargs):
        pass

    def dump(self, *args, **kwargs):
        pass
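

# A rough usage sketch (an illustration, not part of the original API): the
# names `templates`, `feats`, `nr_feat`, `scores`, `d_scores`, and `costs`
# are assumed to be supplied by the caller, and the C-level methods are
# only callable from other Cython code.
#
#     model = LinearModel(nr_class=10, templates=templates)
#     optimizer = Adam(NumpyOps(), 0.001)
#     model.set_scoresC(scores, feats, nr_feat)       # forward pass
#     model.log_lossC(d_scores, scores, costs)        # gradient of the loss
#     model.set_gradientC(d_scores, feats, nr_feat)   # accumulate into d_W
#     model.finish_update(optimizer)                  # apply the update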