diff --git a/.gitignore b/.gitignore index 2aec18a..6d5a8a3 100644 --- a/.gitignore +++ b/.gitignore @@ -6,3 +6,4 @@ .idea/polish-urban-legends-public.iml .idea/vcs.xml .idea/inspectionProfiles/profiles_settings.xml +.idea diff --git a/classifier.py b/solution.py similarity index 90% rename from classifier.py rename to solution.py index 5b9cb50..5c69755 100644 --- a/classifier.py +++ b/solution.py @@ -8,7 +8,7 @@ with open('stopwords') as f: stopwords = [line.rstrip() for line in f] -def classify(path, n_clusters): +def create_clusters(path, n_clusters): with open(path + 'in.tsv') as f: docs = [line.rstrip() for line in f] docs_preprocessed = [] @@ -26,5 +26,5 @@ def classify(path, n_clusters): file.write("%i\n" % label) -classify('dev-0/', n_clusters=10) -classify('test-A/', n_clusters=10) \ No newline at end of file +create_clusters('dev-0/', n_clusters=10) +create_clusters('test-A/', n_clusters=10) \ No newline at end of file