cutoff
This commit is contained in:
parent
ae19f828c0
commit
b6c1bb0227
@ -4,7 +4,7 @@
|
|||||||
kaggle datasets download -d timmate/avocado-prices-2020
|
kaggle datasets download -d timmate/avocado-prices-2020
|
||||||
unzip -o avocado-prices-2020.zip
|
unzip -o avocado-prices-2020.zip
|
||||||
TOTAL_SIZE=$(wc -l avocado-updated-2020.csv)
|
TOTAL_SIZE=$(wc -l avocado-updated-2020.csv)
|
||||||
echo size $TOTAL_SIZE
|
echo "size $TOTAL_SIZE"
|
||||||
|
|
||||||
# przetwarzanie pliku
|
# przetwarzanie pliku
|
||||||
grep -P "^$" -n avocado-updated-2020.csv
|
grep -P "^$" -n avocado-updated-2020.csv
|
||||||
@ -17,7 +17,7 @@ head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv
|
|||||||
|
|
||||||
head -n "$1" avocado-updated-2020-shuf.csv > avocado-2020.csv
|
head -n "$1" avocado-updated-2020-shuf.csv > avocado-2020.csv
|
||||||
TRUNCATED_SIZE=$(wc -l avocado-2020.csv)
|
TRUNCATED_SIZE=$(wc -l avocado-2020.csv)
|
||||||
echo truncated size $TRUNCATED_SIZE
|
echo "truncated size $TRUNCATED_SIZE"
|
||||||
|
|
||||||
# podzial na train/dev/test 6/2/2
|
# podzial na train/dev/test 6/2/2
|
||||||
head -n 6609 avocado-2020.csv > avocado-updated-2020-test.csv
|
head -n 6609 avocado-2020.csv > avocado-updated-2020-test.csv
|
||||||
|
Loading…
Reference in New Issue
Block a user