mirror of
https://github.com/explosion/spaCy.git
synced 2024-12-25 09:26:27 +03:00
Fix FUZZY operator definition (#12318)
* Fix FUZZY operator definition

The default length of the FUZZY operator is 2 and not 3.

* adjust edit distance in matcher usage docs too

---------

Co-authored-by: svlandeg <svlandeg@github.com>
This commit is contained in:
parent
80bc140533
commit
daedc45d05
|
@ -384,10 +384,10 @@ the more specific attributes `FUZZY1`..`FUZZY9` you can specify the maximum
|
||||||
allowed edit distance directly.
|
allowed edit distance directly.
|
||||||
|
|
||||||
```python
|
```python
|
||||||
# Match lowercase with fuzzy matching (allows 3 edits)
|
# Match lowercase with fuzzy matching (allows 2 edits by default)
|
||||||
pattern = [{"LOWER": {"FUZZY": "definitely"}}]
|
pattern = [{"LOWER": {"FUZZY": "definitely"}}]
|
||||||
|
|
||||||
# Match custom attribute values with fuzzy matching (allows 3 edits)
|
# Match custom attribute values with fuzzy matching (allows 2 edits by default)
|
||||||
pattern = [{"_": {"country": {"FUZZY": "Kyrgyzstan"}}}]
|
pattern = [{"_": {"country": {"FUZZY": "Kyrgyzstan"}}}]
|
||||||
|
|
||||||
# Match with exact Levenshtein edit distance limits (allows 4 edits)
|
# Match with exact Levenshtein edit distance limits (allows 4 edits)
|
||||||
|
|
|
@ -70,13 +70,13 @@ distance of 2 and up to 30% of the pattern string length. `FUZZY1`..`FUZZY9` can
|
||||||
be used to specify the exact number of allowed edits.
|
be used to specify the exact number of allowed edits.
|
||||||
|
|
||||||
```python
|
```python
|
||||||
# Match lowercase with fuzzy matching (allows up to 3 edits)
|
# Match lowercase with fuzzy matching (allows 2 edits by default)
|
||||||
pattern = [{"LOWER": {"FUZZY": "definitely"}}]
|
pattern = [{"LOWER": {"FUZZY": "definitely"}}]
|
||||||
|
|
||||||
# Match custom attribute values with fuzzy matching (allows up to 3 edits)
|
# Match custom attribute values with fuzzy matching (allows 2 edits by default)
|
||||||
pattern = [{"_": {"country": {"FUZZY": "Kyrgyzstan"}}}]
|
pattern = [{"_": {"country": {"FUZZY": "Kyrgyzstan"}}}]
|
||||||
|
|
||||||
# Match with exact Levenshtein edit distance limits (allows up to 4 edits)
|
# Match with exact Levenshtein edit distance limits (allows 4 edits)
|
||||||
pattern = [{"_": {"country": {"FUZZY4": "Kyrgyzstan"}}}]
|
pattern = [{"_": {"country": {"FUZZY4": "Kyrgyzstan"}}}]
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user