cutoff parameter

This commit is contained in:
patrycjalazna 2021-03-28 16:22:31 +02:00
parent a95c33308e
commit 58db37cb76

View File

@@ -4,17 +4,22 @@
kaggle datasets download -d timmate/avocado-prices-2020 kaggle datasets download -d timmate/avocado-prices-2020
unzip -o avocado-prices-2020.zip unzip -o avocado-prices-2020.zip
wc -l avocado-updated-2020.csv wc -l avocado-updated-2020.csv
echo "$1 'AAAAAAAAAAAAAAAAA"
# przetwarzanie pliku # przetwarzanie pliku
grep -P "^$" -n avocado-updated-2020.csv grep -P "^$" -n avocado-updated-2020.csv
# usuniecie zbednej kolumny year (redundantne dane) # usuniecie zbednej kolumny year (redundantne dane)
cut -d -f12 --complement avocado-updated-2020.csv cut -d ',' -f12 --complement avocado-updated-2020.csv
head -n 1 avocado-updated-2020.csv > header.csv head -n 1 avocado-updated-2020.csv > header.csv
head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv
echo "$1 AAAAAAAAAAAAAAAAA"
head -n "-$1" avocado-updated-2020-shuf.csv > avocado-2020.csv
wc -l avocado-2020.csv
# podzial na train/dev/test # podzial na train/dev/test
head -n 6609 avocado-updated-2020-shuf.csv > avocado-updated-2020-test.csv head -n 6609 avocado-updated-2020-shuf.csv > avocado-updated-2020-test.csv
head -n 13218 avocado-updated-2020-shuf.csv | tail -n 6609 > avocado-updated-2020-dev.csv head -n 13218 avocado-updated-2020-shuf.csv | tail -n 6609 > avocado-updated-2020-dev.csv