mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 09:56:28 +03:00
Default to former TextCategorizer model
* Keep TextCategorizer default model same as v2.0 * Add option 'architecture' that allows "simple_cnn" to switch to simpler model. * Add option exclusive_classes, defaulting to False. If set to True, the model treats classes as mutually exclusive, i.e. only one class can be true per instance.
This commit is contained in:
parent
829c9091a4
commit
ce1e4eace2
|
@ -24,7 +24,8 @@ from ..vocab cimport Vocab
|
||||||
from ..syntax import nonproj
|
from ..syntax import nonproj
|
||||||
from ..attrs import POS, ID
|
from ..attrs import POS, ID
|
||||||
from ..parts_of_speech import X
|
from ..parts_of_speech import X
|
||||||
from .._ml import Tok2Vec, build_tagger_model, build_simple_cnn_text_classifier
|
from .._ml import Tok2Vec, build_tagger_model
|
||||||
|
from .._ml import build_text_classifier, build_simple_cnn_text_classifier
|
||||||
from .._ml import link_vectors_to_models, zero_init, flatten
|
from .._ml import link_vectors_to_models, zero_init, flatten
|
||||||
from .._ml import masked_language_model, create_default_optimizer
|
from .._ml import masked_language_model, create_default_optimizer
|
||||||
from ..errors import Errors, TempErrors
|
from ..errors import Errors, TempErrors
|
||||||
|
@ -862,8 +863,11 @@ class TextCategorizer(Pipe):
|
||||||
token_vector_width = cfg["token_vector_width"]
|
token_vector_width = cfg["token_vector_width"]
|
||||||
else:
|
else:
|
||||||
token_vector_width = util.env_opt("token_vector_width", 96)
|
token_vector_width = util.env_opt("token_vector_width", 96)
|
||||||
tok2vec = Tok2Vec(token_vector_width, embed_size, **cfg)
|
if cfg.get('architecture') == 'simple_cnn':
|
||||||
return build_simple_cnn_text_classifier(tok2vec, nr_class, **cfg)
|
tok2vec = Tok2Vec(token_vector_width, embed_size, **cfg)
|
||||||
|
return build_simple_cnn_text_classifier(tok2vec, nr_class, **cfg)
|
||||||
|
else:
|
||||||
|
return build_text_classifier(nr_class, **cfg)
|
||||||
|
|
||||||
@property
|
@property
|
||||||
def tok2vec(self):
|
def tok2vec(self):
|
||||||
|
|
Loading…
Reference in New Issue
Block a user