mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-26 09:14:32 +03:00
Fix shape inference in begin_training
This commit is contained in:
parent
1729165e90
commit
f075655deb
|
@@ -15,10 +15,9 @@ def build_tb_parser_model(
|
||||||
use_upper=True,
|
use_upper=True,
|
||||||
nO=None,
|
nO=None,
|
||||||
):
|
):
|
||||||
token_vector_width = tok2vec.get_dim("nO")
|
|
||||||
tok2vec = chain(
|
tok2vec = chain(
|
||||||
tok2vec,
|
tok2vec,
|
||||||
with_array(Linear(hidden_width, token_vector_width)),
|
with_array(Linear(hidden_width)),
|
||||||
list2array(),
|
list2array(),
|
||||||
)
|
)
|
||||||
tok2vec.set_dim("nO", hidden_width)
|
tok2vec.set_dim("nO", hidden_width)
|
||||||
|
|
|
@@ -6,9 +6,8 @@ from ...util import registry
|
||||||
|
|
||||||
@registry.architectures.register("spacy.Tagger.v1")
|
@registry.architectures.register("spacy.Tagger.v1")
|
||||||
def build_tagger_model(tok2vec, nO=None) -> Model:
|
def build_tagger_model(tok2vec, nO=None) -> Model:
|
||||||
token_vector_width = tok2vec.get_dim("nO")
|
|
||||||
# TODO: glorot_uniform_init seems to work a bit better than zero_init here?!
|
# TODO: glorot_uniform_init seems to work a bit better than zero_init here?!
|
||||||
output_layer = Softmax(nO, nI=token_vector_width, init_W=zero_init)
|
output_layer = Softmax(nO, init_W=zero_init)
|
||||||
softmax = with_array(output_layer)
|
softmax = with_array(output_layer)
|
||||||
model = chain(tok2vec, softmax)
|
model = chain(tok2vec, softmax)
|
||||||
model.set_ref("tok2vec", tok2vec)
|
model.set_ref("tok2vec", tok2vec)
|
||||||
|
|
|
@@ -38,8 +38,8 @@ def forward(model, X, is_train):
|
||||||
|
|
||||||
|
|
||||||
def init(model, X=None, Y=None):
|
def init(model, X=None, Y=None):
|
||||||
tok2vec = model.get_ref("tok2vec").initialize()
|
tok2vec = model.get_ref("tok2vec").initialize(X=X)
|
||||||
lower = model.get_ref("lower").initialize(X=X)
|
lower = model.get_ref("lower").initialize()
|
||||||
if model.attrs["has_upper"]:
|
if model.attrs["has_upper"]:
|
||||||
statevecs = model.ops.alloc2f(2, lower.get_dim("nO"))
|
statevecs = model.ops.alloc2f(2, lower.get_dim("nO"))
|
||||||
model.get_ref("upper").initialize(X=statevecs)
|
model.get_ref("upper").initialize(X=statevecs)
|
||||||
|
|
|
@@ -531,7 +531,12 @@ class Tagger(Pipe):
|
||||||
vocab.morphology.lemmatizer,
|
vocab.morphology.lemmatizer,
|
||||||
exc=vocab.morphology.exc)
|
exc=vocab.morphology.exc)
|
||||||
self.set_output(len(self.labels))
|
self.set_output(len(self.labels))
|
||||||
self.model.initialize()
|
doc_sample = [Doc(self.vocab, words=["hello", "world"])]
|
||||||
|
for name, component in pipeline:
|
||||||
|
if component is self:
|
||||||
|
break
|
||||||
|
doc_sample = list(component.pipe(doc_sample))
|
||||||
|
self.model.initialize(X=doc_sample)
|
||||||
# Get batch of example docs, example outputs to call begin_training().
|
# Get batch of example docs, example outputs to call begin_training().
|
||||||
# This lets the model infer shapes.
|
# This lets the model infer shapes.
|
||||||
link_vectors_to_models(self.vocab)
|
link_vectors_to_models(self.vocab)
|
||||||
|
|
|
@@ -629,6 +629,10 @@ cdef class Parser:
|
||||||
for doc, gold in parses:
|
for doc, gold in parses:
|
||||||
doc_sample.append(doc)
|
doc_sample.append(doc)
|
||||||
gold_sample.append(gold)
|
gold_sample.append(gold)
|
||||||
|
for name, component in pipeline:
|
||||||
|
if component is self:
|
||||||
|
break
|
||||||
|
doc_sample = list(component.pipe(doc_sample))
|
||||||
self.model.initialize(doc_sample, gold_sample)
|
self.model.initialize(doc_sample, gold_sample)
|
||||||
if pipeline is not None:
|
if pipeline is not None:
|
||||||
self.init_multitask_objectives(get_examples, pipeline, sgd=sgd, **self.cfg)
|
self.init_multitask_objectives(get_examples, pipeline, sgd=sgd, **self.cfg)
|
||||||
|
|
Loading…
Reference in New Issue
Block a user