current_month_mean_from_train

This commit is contained in:
kubapok 2021-12-23 15:27:58 +01:00
parent 402e7b90ac
commit ec4be03ea1
3 changed files with 1339 additions and 1320 deletions

View File

@@ -0,0 +1,19 @@
import pandas as pd
# Baseline predictor: for every row of the evaluation sets, emit the mean
# 'opad' value observed in the training data for the same ('rok', 'miesiąc')
# pair.

# Training features and targets live in two parallel, header-less TSV files.
train_in = pd.read_csv(
    '../train/in.tsv',
    header=None,
    names=['id', 'nazwa', 'typ_zbioru', 'rok', 'miesiąc'],
    sep='\t',
)
train_exp = pd.read_csv(
    '../train/expected.tsv',
    header=None,
    names=['opad'],
    sep='\t',
)

# Attach the target column to a copy so train_in itself stays untouched.
train = train_in.copy()
train['opad'] = train_exp['opad']

# Average only the target column. Calling .mean() on the whole grouped frame
# would also try to average every other column; with pandas >= 2.0
# (numeric_only defaults to False) that raises TypeError as soon as one of
# them is non-numeric (presumably 'nazwa' / 'typ_zbioru' -- verify against
# the data). The double brackets keep by_miesiac a DataFrame with an 'opad'
# column, indexed by ('rok', 'miesiąc').
by_miesiac = train.groupby(['rok', 'miesiąc'])[['opad']].mean()

for dataset in ('dev-0', 'test-A'):
    # Open the input first so a missing in.tsv does not leave behind a
    # freshly truncated out.tsv. The encoding is explicit so the result does
    # not depend on the locale (pd.read_csv above already reads as UTF-8).
    with open(f'../{dataset}/in.tsv', 'r', encoding='utf-8') as f_in:
        with open(f'../{dataset}/out.tsv', 'w', encoding='utf-8') as f_out:
            for line in f_in:
                # Each row must have exactly five tab-separated fields; only
                # the last two (year, month) are used for the lookup.
                _, _, _, rok, miesiac = line.rstrip().split('\t')
                # Raises KeyError when the (year, month) pair never occurred
                # in the training data.
                srednia = by_miesiac.loc[(int(rok), int(miesiac)), 'opad']
                f_out.write(str(srednia) + '\n')

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff