From 22853ee945a6d1784cb4bb888d8367feda6ac2db Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=C5=81ukasz=20J=C4=99dyk?= Date: Fri, 21 May 2021 13:16:42 +0200 Subject: [PATCH] final version --- main.py | 1 - 1 file changed, 1 deletion(-) diff --git a/main.py b/main.py index e91b6d4..0af190a 100644 --- a/main.py +++ b/main.py @@ -42,7 +42,6 @@ X_dev = [word_tokenize(content) for content in X_dev] X_test = [word_tokenize(content) for content in X_test] # word2vec -#word2vec = Word2Vec(X_train, vector_size=50, window=5, min_count=1) word2vec = gensim.downloader.load('word2vec-google-news-300') X_train = [np.mean([word2vec[word] for word in content if word in word2vec] or [np.zeros(300)], axis=0) for content in X_train] X_dev = [np.mean([word2vec[word] for word in content if word in word2vec] or [np.zeros(300)], axis=0) for content in X_dev]