# Patch summary (avocado-preprocessing.sh, two hunks):
#   * TOTAL_SIZE / TRUNCATED_SIZE: the removed lines have whitespace around
#     `=` (`TOTAL_SIZE= $(...)`, `TRUNCATED_SIZE = $(...)`); the added lines
#     use `NAME=$(...)` with no spaces, which is the form the shell parses as
#     a variable assignment.
#   * Both `echo` calls now pass a single double-quoted string, so the
#     expanded variable is no longer subject to word splitting or globbing.
#   * All other records are unchanged hunk context; the `#` lines inside the
#     hunks belong to the target script and must stay byte-for-byte as they
#     are for the hunks to match.
#
# NOTE(review): the patch text below sits on one physical line. A unified
# diff needs one record per line (header, `@@` hunk header, ' ', '-', '+'),
# so line breaks must be restored before `git apply` / `patch` can use it.
# The second hunk declares 8 old lines but only 7 records are visible here,
# presumably one blank context line was lost - TODO confirm against the
# original commit instead of guessing.
#
# NOTE(review): `wc -l FILE` prints the count followed by the file name, so
# after this patch the variables hold "<count> <file>" rather than a bare
# number; `wc -l < FILE` would yield the count alone - confirm whether that
# matters for the script's later use of these values.
diff --git a/avocado-preprocessing.sh b/avocado-preprocessing.sh index b74ccfb..872f9dd 100755 --- a/avocado-preprocessing.sh +++ b/avocado-preprocessing.sh @@ -3,8 +3,8 @@ # pobranie zbioru danych kaggle datasets download -d timmate/avocado-prices-2020 unzip -o avocado-prices-2020.zip -TOTAL_SIZE= $(wc -l avocado-updated-2020.csv) -echo size $TOTAL_SIZE +TOTAL_SIZE=$(wc -l avocado-updated-2020.csv) +echo "size $TOTAL_SIZE" # przetwarzanie pliku grep -P "^$" -n avocado-updated-2020.csv @@ -16,8 +16,8 @@ head -n 1 avocado-updated-2020.csv > header.csv head -n -1 avocado-updated-2020.csv | shuf > avocado-updated-2020-shuf.csv head -n "$1" avocado-updated-2020-shuf.csv > avocado-2020.csv -TRUNCATED_SIZE = $(wc -l avocado-2020.csv) -echo truncated size $TRUNCATED_SIZE +TRUNCATED_SIZE=$(wc -l avocado-2020.csv) +echo "truncated size $TRUNCATED_SIZE" # podzial na train/dev/test 6/2/2 head -n 6609 avocado-2020.csv > avocado-updated-2020-test.csv