This commit is contained in:
Mateusz 2024-05-19 12:03:31 +02:00
parent 3817604049
commit 10b830e7a0
4 changed files with 1888 additions and 1886 deletions

12
.gitignore vendored
View File

@@ -1,5 +1,7 @@
word2vec_100_3_polish.bin
word2vec_100_3_polish.bin.syn0.npy
word2vec_300_3_polish.bin
word2vec_300_3_polish.bin.trainables.syn1neg.npy
word2vec_300_3_polish.bin.wv.vectors.npy
fasttext_100_3_polish.bin
fasttext_100_3_polish.bin.trainables.syn1neg.npy
fasttext_100_3_polish.bin.trainables.vectors_ngrams_lockf.npy
fasttext_100_3_polish.bin.trainables.vectors_vocab_lockf.npy
fasttext_100_3_polish.bin.wv.vectors_ngrams.npy
fasttext_100_3_polish.bin.wv.vectors_vocab.npy
fasttext_100_3_polish.bin.wv.vectors.npy

File diff suppressed because it is too large Load Diff

4
run.py
View File

@@ -31,10 +31,10 @@ def main():
train_dataset, dev_0_dataset, test_A_dataset = read_data()
# Word2Vec parameters
vector_size = 300
vector_size = 100
# Training the Word2Vec model
word2vec = KeyedVectors.load("word2vec_300_3_polish.bin")
word2vec = KeyedVectors.load("fasttext_100_3_polish.bin")
# Convert text to vectors
train_vectors = np.array(

File diff suppressed because it is too large Load Diff