mirror of
https://github.com/Findus23/cr-search.git
synced 2024-09-11 06:03:45 +02:00
add comments
This commit is contained in:
parent
473dfa3b4d
commit
92ce4c3859
2 changed files with 9 additions and 0 deletions
|
@ -1,3 +1,8 @@
|
|||
"""
|
||||
from https://github.com/explosion/spaCy/blob/master/spacy/lang/en/stop_words.py
|
||||
|
||||
without contractions
|
||||
"""
|
||||
STOP_WORDS = set(
|
||||
"""
|
||||
a about above across after afterwards again against all almost alone along
|
||||
|
|
4
typo.py
4
typo.py
|
@ -1,3 +1,7 @@
|
|||
"""
|
||||
replace common typos of names to unify them in the database
|
||||
"""
|
||||
|
||||
typos = {
|
||||
"Matt": {"Mat", "Mattt", "\"Matt"},
|
||||
"Sam": {"San", "Nott", "Sma", "Sasm", "Sm"},
|
||||
|
|
Loading…
Reference in a new issue