1
0
Fork 0
mirror of https://github.com/Findus23/cr-search.git synced 2024-09-19 15:23:44 +02:00

add comments

This commit is contained in:
Lukas Winkler 2020-03-07 10:51:44 +01:00
parent 473dfa3b4d
commit 92ce4c3859
Signed by: lukas
GPG key ID: 54DE4D798D244853
2 changed files with 9 additions and 0 deletions

View file

@@ -1,3 +1,8 @@
"""
Stop word list taken from
https://github.com/explosion/spaCy/blob/master/spacy/lang/en/stop_words.py
with the contractions removed.
"""
STOP_WORDS = set(
"""
a about above across after afterwards again against all almost alone along

View file

@@ -1,3 +1,7 @@
"""
Maps each canonical name to the set of common typos that should be replaced
by it, so that names are unified in the database.
"""
typos = {
"Matt": {"Mat", "Mattt", "\"Matt"},
"Sam": {"San", "Nott", "Sma", "Sasm", "Sm"},