test 10 version

This commit is contained in:
pietrzakkuba 2022-04-03 14:14:56 +02:00
parent c02c81943b
commit 8318a7ab4b
3 changed files with 11003 additions and 15418 deletions

File diff suppressed because it is too large Load Diff

View File

@ -63,12 +63,13 @@ for index, words_1_3 in enumerate(model):
print(f'normalizacja: {index / model_len}')
count = sum(model[words_1_3].values())
for word_2 in model[words_1_3]:
model[words_1_3][word_2] /= float(count)
model[words_1_3][word_2] += 1
model[words_1_3][word_2] /= float(count + len(word_2)))
def make_prediction(file):
file_in = pd.read_csv(f'{file}/in.tsv.xz', sep='\t', on_bad_lines='skip', header=None, quoting=csv.QUOTE_NONE)
with open(f'{file}/out.tsv', 'w') as file_out:
with open(f'{file}/out.tsv', 'w', encoding='utf-8') as file_out:
print(f'zapisywanie {file}')
for line_in in file_in.iterrows():
before = line_in[1][6]

File diff suppressed because it is too large Load Diff