cutoff parameter
This commit is contained in:
parent
a95c33308e
commit
58db37cb76
@ -4,17 +4,22 @@
|
|||||||
kaggle datasets download -d timmate/avocado-prices-2020
|
kaggle datasets download -d timmate/avocado-prices-2020
|
||||||
unzip -o avocado-prices-2020.zip
|
unzip -o avocado-prices-2020.zip
|
||||||
wc -l avocado-updated-2020.csv
|
wc -l avocado-updated-2020.csv
|
||||||
echo "$1 'AAAAAAAAAAAAAAAAA"
|
|
||||||
|
|
||||||
# przetwarzanie pliku
|
# przetwarzanie pliku
|
||||||
grep -P "^$" -n avocado-updated-2020.csv
|
grep -P "^$" -n avocado-updated-2020.csv
|
||||||
|
|
||||||
# usuniecie zbednej kolumny year (redundantne dane)
|
# usuniecie zbednej kolumny year (redundantne dane)
|
||||||
cut -d -f12 --complement avocado-updated-2020.csv
|
cut -d ',' -f12 --complement avocado-updated-2020.csv
|
||||||
|
|
||||||
head -n 1 avocado-updated-2020.csv> header.csv
|
head -n 1 avocado-updated-2020.csv > header.csv
|
||||||
head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv
|
head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv
|
||||||
|
|
||||||
|
echo "$1 AAAAAAAAAAAAAAAAA"
|
||||||
|
head -n "-$1" avocado-updated-2020-shuf.csv > avocado-2020.csv
|
||||||
|
wc -l avocado-2020.csv
|
||||||
|
|
||||||
|
|
||||||
# podzial na train/dev/test
|
# podzial na train/dev/test
|
||||||
head -n 6609 avocado-updated-2020-shuf.csv > avocado-updated-2020-test.csv
|
head -n 6609 avocado-updated-2020-shuf.csv > avocado-updated-2020-test.csv
|
||||||
head -n 13218 avocado-updated-2020-shuf.csv | tail -n 6609 > avocado-updated-2020-dev.csv
|
head -n 13218 avocado-updated-2020-shuf.csv | tail -n 6609 > avocado-updated-2020-dev.csv
|
||||||
|
Loading…
Reference in New Issue
Block a user