test 10 version
This commit is contained in:
parent
c02c81943b
commit
8318a7ab4b
14548
dev-0/out.tsv
14548
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
5
model.py
5
model.py
@ -63,12 +63,13 @@ for index, words_1_3 in enumerate(model):
|
||||
print(f'normalizacja: {index / model_len}')
|
||||
count = sum(model[words_1_3].values())
|
||||
for word_2 in model[words_1_3]:
|
||||
model[words_1_3][word_2] /= float(count)
|
||||
model[words_1_3][word_2] += 1
|
||||
model[words_1_3][word_2] /= float(count + len(word_2)))
|
||||
|
||||
|
||||
def make_prediction(file):
|
||||
file_in = pd.read_csv(f'{file}/in.tsv.xz', sep='\t', on_bad_lines='skip', header=None, quoting=csv.QUOTE_NONE)
|
||||
with open(f'{file}/out.tsv', 'w') as file_out:
|
||||
with open(f'{file}/out.tsv', 'w', encoding='utf-8') as file_out:
|
||||
print(f'zapisywanie {file}')
|
||||
for line_in in file_in.iterrows():
|
||||
before = line_in[1][6]
|
||||
|
11868
test-A/out.tsv
11868
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue
Block a user