paranormal-or-skeptic/train_word2vec.py

12 lines
368 B
Python

import csv
from gensim.test.utils import common_texts
from gensim.models import Word2Vec
# Train a Word2Vec model on the text in train/in.tsv, then save both the full
# model and its standalone word vectors to the current working directory.
with open("train/in.tsv", encoding="utf-8", newline="") as f:
    # Word2Vec walks the corpus more than once (vocabulary scan, then every
    # training epoch), so a one-shot csv.reader tied to a file that is about
    # to be closed cannot be passed to it directly. Materialise the tokenised
    # rows while the file is still open. Blank lines yield empty rows and are
    # skipped so that row[0] is always valid.
    # NOTE(review): assumes the document text is the first tab-separated
    # column and that plain whitespace tokenisation is adequate -- confirm
    # against the actual layout of train/in.tsv.
    # NOTE(review): this holds the whole tokenised corpus in memory; switch to
    # a restartable iterable if the file is too large for that.
    texts = [row[0].split() for row in csv.reader(f, delimiter="\t") if row]

# Train on the corpus read above. The earlier version passed gensim's bundled
# `common_texts` demo sentences here, so the training file was never used.
model = Word2Vec(sentences=texts, vector_size=100, window=5, min_count=1, workers=4)
model.save("word2vec.model")

# Also store the word vectors on their own, separately from the full model.
word_vectors = model.wv
word_vectors.save("word2vec.wordvectors")