mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-11 04:08:09 +03:00
Merge branch 'master' into spacy.io
This commit is contained in:
commit
a9ad735241
|
@ -404,7 +404,7 @@ class BadHTMLMerger(object):
|
|||
for match_id, start, end in matches:
|
||||
spans.append(doc[start:end])
|
||||
with doc.retokenize() as retokenizer:
|
||||
for span in spans:
|
||||
for span in hashtags:
|
||||
retokenizer.merge(span)
|
||||
for token in span:
|
||||
token._.bad_html = True # Mark token as bad HTML
|
||||
|
|
Loading…
Reference in New Issue
Block a user