Update 'process_dataset.py'
All checks were successful
s449288-evaluation/pipeline/head This commit looks good
s449288-training/pipeline/head This commit looks good

This commit is contained in:
Kacper Dudzic 2022-05-09 11:28:14 +02:00
parent 674c95103e
commit 166c30997e

View File

@@ -18,10 +18,10 @@ print(lego)
print(lego.describe(include='all')) print(lego.describe(include='all'))
# pierwszy podzial, wydzielamy zbior treningowy # pierwszy podzial, wydzielamy zbior treningowy
lego_train, lego_rem = train_test_split(lego, train_size=0.8, random_state=1) lego_train, lego_rem = train_test_split(lego, train_size=0.8)
# drugi podział, wydzielamy walidacyjny i testowy # drugi podział, wydzielamy walidacyjny i testowy
lego_valid, lego_test = train_test_split(lego_rem, test_size=0.5, random_state=1) lego_valid, lego_test = train_test_split(lego_rem, test_size=0.5)
# zapis # zapis
lego.to_csv('lego_sets_clean.csv', index=None, header=True) lego.to_csv('lego_sets_clean.csv', index=None, header=True)