This commit is contained in:
s434732 2022-04-03 17:50:02 +02:00
parent 2b584a30dc
commit e362ba345c

6
run.py
View File

@ -13,12 +13,6 @@ import csv
import re
# In[172]:
def clean_text(text):
    """Normalize a raw text fragment: lowercase it, undo escaped line breaks, drop punctuation.

    The input is expected to contain *literal* two-character ``\\n`` sequences
    (a backslash followed by ``n``), not real newline characters:

    * ``-\\n`` (a hyphen directly before an escaped line break) is removed so
      that a word split across lines is glued back together.
    * any remaining ``\\n`` is replaced by a single space.

    Afterwards every character whose Unicode general category starts with
    ``P`` (punctuation) is removed. Symbols such as ``+`` or ``$`` are not
    punctuation and are kept.

    Args:
        text: The string to clean.

    Returns:
        The cleaned, lowercased string.
    """
    # Imported locally so this function does not depend on a module-level import.
    import unicodedata

    text = text.lower().replace('-\\n', '').replace('\\n', ' ')
    # The stdlib ``re`` module has no ``\p{P}`` property class (the pattern
    # fails to compile with "bad escape \p"), so filter by Unicode category.
    return ''.join(
        ch for ch in text if not unicodedata.category(ch).startswith('P')
    )
# Two-level mapping: a missing outer key yields a fresh inner mapping, and a
# missing inner key yields 0 (``int()`` returns 0), so entries can be
# incremented without prior initialization.
model = defaultdict(lambda: defaultdict(int))