mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-24 17:06:29 +03:00
Remove has_letters in config template (#11465)
Due to problems with the JavaScript conversion in the website quickstart, remove the `has_letters` setting to simplify generating `attrs` for the default `tok2vec`. Additionally, reduce the number of `rows` for `PREFIX` (from 2500 to 1000) to match the trained pipelines.
This commit is contained in:
parent
0c72c6bb2c
commit
8a86a35eab
|
@ -271,13 +271,8 @@ factory = "tok2vec"
|
||||||
[components.tok2vec.model.embed]
|
[components.tok2vec.model.embed]
|
||||||
@architectures = "spacy.MultiHashEmbed.v2"
|
@architectures = "spacy.MultiHashEmbed.v2"
|
||||||
width = ${components.tok2vec.model.encode.width}
|
width = ${components.tok2vec.model.encode.width}
|
||||||
{% if has_letters -%}
|
|
||||||
attrs = ["NORM", "PREFIX", "SUFFIX", "SHAPE"]
|
attrs = ["NORM", "PREFIX", "SUFFIX", "SHAPE"]
|
||||||
rows = [5000, 2500, 2500, 2500]
|
rows = [5000, 1000, 2500, 2500]
|
||||||
{% else -%}
|
|
||||||
attrs = ["ORTH", "SHAPE"]
|
|
||||||
rows = [5000, 2500]
|
|
||||||
{% endif -%}
|
|
||||||
include_static_vectors = {{ "true" if optimize == "accuracy" else "false" }}
|
include_static_vectors = {{ "true" if optimize == "accuracy" else "false" }}
|
||||||
|
|
||||||
[components.tok2vec.model.encode]
|
[components.tok2vec.model.encode]
|
||||||
|
|
|
@ -271,4 +271,3 @@ zh:
|
||||||
accuracy:
|
accuracy:
|
||||||
name: bert-base-chinese
|
name: bert-base-chinese
|
||||||
size_factor: 3
|
size_factor: 3
|
||||||
has_letters: false
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user