mirror of
https://github.com/explosion/spaCy.git
synced 2024-11-14 05:37:03 +03:00
Add missing we've and hardcoded 's and 'S
This commit is contained in:
parent
a5e0a0073b
commit
5876248109
|
@ -94,7 +94,7 @@ starting_tokens = {
|
||||||
"there": {"'d": [], "'d've": [], "'s": ["contrLower", "contrUpper"]},
|
"there": {"'d": [], "'d've": [], "'s": ["contrLower", "contrUpper"]},
|
||||||
"they": {"'d": [], "'d've": [], "'ll": [], "'re": [], "'ve": []},
|
"they": {"'d": [], "'d've": [], "'ll": [], "'re": [], "'ve": []},
|
||||||
"was": {"n't": []},
|
"was": {"n't": []},
|
||||||
"we": {"'d": ["contrLower", "contrUpper"], "'d've": [], "'ll": ["contrLower", "contrUpper"], "'re": ["contrLower", "contrUpper"]},
|
"we": {"'d": ["contrLower", "contrUpper"], "'d've": [], "'ll": ["contrLower", "contrUpper"], "'re": ["contrLower", "contrUpper"], "'ve": []},
|
||||||
"were": {"n't": []},
|
"were": {"n't": []},
|
||||||
"what": {"'ll": [], "'re": [], "'s": [], "'ve": []},
|
"what": {"'ll": [], "'re": [], "'s": [], "'ve": []},
|
||||||
"when": {"'s": []},
|
"when": {"'s": []},
|
||||||
|
@ -110,6 +110,11 @@ starting_tokens = {
|
||||||
# other specials that don't really have contractions
|
# other specials that don't really have contractions
|
||||||
# so they are hardcoded
|
# so they are hardcoded
|
||||||
hardcoded_specials = {
|
hardcoded_specials = {
|
||||||
|
|
||||||
|
"'s": [{"F": "'s", "L": "'s"}],
|
||||||
|
|
||||||
|
"'S": [{"F": "'S", "L": "'s"}],
|
||||||
|
|
||||||
"'em": [{"F": "'em"}],
|
"'em": [{"F": "'em"}],
|
||||||
|
|
||||||
"'ol": [{"F": "'ol"}],
|
"'ol": [{"F": "'ol"}],
|
||||||
|
|
File diff suppressed because one or more lines are too long
Loading…
Reference in New Issue
Block a user