mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-26 18:06:29 +03:00
Fix typos in docs (closes #3802) [ci skip]
This commit is contained in:
parent
1f13005751
commit
0c74506c9c
|
@@ -405,7 +405,7 @@ class BadHTMLMerger(object):
|
||||||
for match_id, start, end in matches:
|
for match_id, start, end in matches:
|
||||||
spans.append(doc[start:end])
|
spans.append(doc[start:end])
|
||||||
with doc.retokenize() as retokenizer:
|
with doc.retokenize() as retokenizer:
|
||||||
for span in hashtags:
|
for span in spans:
|
||||||
retokenizer.merge(span)
|
retokenizer.merge(span)
|
||||||
for token in span:
|
for token in span:
|
||||||
token._.bad_html = True # Mark token as bad HTML
|
token._.bad_html = True # Mark token as bad HTML
|
||||||
|
@@ -679,7 +679,7 @@ for match_id, start, end in matches:
|
||||||
if doc.vocab.strings[match_id] == "HASHTAG":
|
if doc.vocab.strings[match_id] == "HASHTAG":
|
||||||
hashtags.append(doc[start:end])
|
hashtags.append(doc[start:end])
|
||||||
with doc.retokenize() as retokenizer:
|
with doc.retokenize() as retokenizer:
|
||||||
for span in spans:
|
for span in hashtags:
|
||||||
retokenizer.merge(span)
|
retokenizer.merge(span)
|
||||||
for token in span:
|
for token in span:
|
||||||
token._.is_hashtag = True
|
token._.is_hashtag = True
|
||||||
|
|
Loading…
Reference in New Issue
Block a user