mirror of
https://github.com/explosion/spaCy.git
synced 2025-01-23 15:54:13 +03:00
Update textcat example
This commit is contained in:
parent
774f5732bd
commit
79a94bc166
|
@ -1,3 +1,7 @@
|
||||||
|
'''Train a multi-label convolutional neural network text classifier,
|
||||||
|
using the spacy.pipeline.TextCategorizer component. The model is then added
|
||||||
|
to spacy.pipeline, and predictions are available at `doc.cats`.
|
||||||
|
'''
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
import plac
|
import plac
|
||||||
import random
|
import random
|
||||||
|
@ -31,7 +35,7 @@ def train_textcat(tokenizer, textcat,
|
||||||
train_data = tqdm.tqdm(train_data, leave=False) # Progress bar
|
train_data = tqdm.tqdm(train_data, leave=False) # Progress bar
|
||||||
for batch in minibatch(train_data, size=batch_sizes):
|
for batch in minibatch(train_data, size=batch_sizes):
|
||||||
docs, golds = zip(*batch)
|
docs, golds = zip(*batch)
|
||||||
textcat.update((docs, None), golds, sgd=optimizer, drop=0.2,
|
textcat.update(docs, golds, sgd=optimizer, drop=0.2,
|
||||||
losses=losses)
|
losses=losses)
|
||||||
with textcat.model.use_params(optimizer.averages):
|
with textcat.model.use_params(optimizer.averages):
|
||||||
scores = evaluate(tokenizer, textcat, dev_texts, dev_cats)
|
scores = evaluate(tokenizer, textcat, dev_texts, dev_cats)
|
||||||
|
|
Loading…
Reference in New Issue
Block a user