mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-10 19:57:17 +03:00
85dd2b6c04
* Parser: use C saxpy/sgemm provided by the Ops implementation This is a backport of https://github.com/explosion/spaCy/pull/10747 from the parser refactor branch. It eliminates the explicit calls to BLIS, instead using the saxpy/sgemm provided by the Ops implementation. This allows us to use Accelerate in the parser on M1 Macs (with an updated thinc-apple-ops). Performance of the de_core_news_lg pipe: BLIS 0.7.0, no thinc-apple-ops: 6385 WPS BLIS 0.7.0, thinc-apple-ops: 36455 WPS BLIS 0.9.0, no thinc-apple-ops: 19188 WPS BLIS 0.9.0, thinc-apple-ops: 36682 WPS This PR, thinc-apple-ops: 38726 WPS Performance of the de_core_news_lg pipe (only tok2vec -> parser): BLIS 0.7.0, no thinc-apple-ops: 13907 WPS BLIS 0.7.0, thinc-apple-ops: 73172 WPS BLIS 0.9.0, no thinc-apple-ops: 41576 WPS BLIS 0.9.0, thinc-apple-ops: 72569 WPS This PR, thinc-apple-ops: 87061 WPS * Require thinc >=8.1.0,<8.2.0 * Lower thinc lowerbound to 8.1.0.dev0 * Use best CPU ops for CBLAS when the parser model is on the GPU * Fix another unguarded cblas() call * Fix: use ops as a shorthand for self.model.ops Co-authored-by: Madeesh Kannan <shadeMe@users.noreply.github.com> Co-authored-by: Madeesh Kannan <shadeMe@users.noreply.github.com>
50 lines
1.1 KiB
Cython
50 lines
1.1 KiB
Cython
from libc.string cimport memset, memcpy
|
|
from thinc.backends.cblas cimport CBlas
|
|
from ..typedefs cimport weight_t, hash_t
|
|
from ..pipeline._parser_internals._state cimport StateC
|
|
|
|
|
|
cdef struct SizesC:
|
|
int states
|
|
int classes
|
|
int hiddens
|
|
int pieces
|
|
int feats
|
|
int embed_width
|
|
|
|
|
|
cdef struct WeightsC:
|
|
const float* feat_weights
|
|
const float* feat_bias
|
|
const float* hidden_bias
|
|
const float* hidden_weights
|
|
const float* seen_classes
|
|
|
|
|
|
cdef struct ActivationsC:
|
|
int* token_ids
|
|
float* unmaxed
|
|
float* scores
|
|
float* hiddens
|
|
int* is_valid
|
|
int _curr_size
|
|
int _max_size
|
|
|
|
|
|
cdef WeightsC get_c_weights(model) except *
|
|
|
|
cdef SizesC get_c_sizes(model, int batch_size) except *
|
|
|
|
cdef ActivationsC alloc_activations(SizesC n) nogil
|
|
|
|
cdef void free_activations(const ActivationsC* A) nogil
|
|
|
|
cdef void predict_states(CBlas cblas, ActivationsC* A, StateC** states,
|
|
const WeightsC* W, SizesC n) nogil
|
|
|
|
cdef int arg_max_if_valid(const weight_t* scores, const int* is_valid, int n) nogil
|
|
|
|
cdef void cpu_log_loss(float* d_scores,
|
|
const float* costs, const int* is_valid, const float* scores, int O) nogil
|
|
|