From 08826dbe52c7cd54148b22d4f2b815756a100582 Mon Sep 17 00:00:00 2001 From: Maciej Date: Mon, 29 Mar 2021 02:30:55 +0200 Subject: [PATCH] Added cutoff parameter --- preparations.sh | 21 ++++++++++++++------- 1 file changed, 14 insertions(+), 7 deletions(-) diff --git a/preparations.sh b/preparations.sh index e21eee5..fda0db1 100755 --- a/preparations.sh +++ b/preparations.sh @@ -4,23 +4,30 @@ curl -OL https://git.wmi.amu.edu.pl/s434784/ium_434784/raw/branch/master/who_sui head -n 1 who_suicide_statistics.csv > names.csv # Randomizacja zbioru. + sed 1d who_suicide_statistics.csv | shuf > data.shuf -#cp who_suicide_statistics.csv data.shuf +# Ilosc wierszy +NUMROWS=$(cat data.shuf | wc -l) +echo "Initial number of rows ${NUMROWS}" +DELETE=$((NUMROWS - $1)) +echo "Cutting $1 rows" +tail -n $DELETE data.shuf > data.shuf.cut # Podzial na 3 pozbiory - #Ustalenie proporcji 6:2:2 -NUMROWS=$(cat data.shuf | wc -l) +NUMROWS=$(cat data.shuf.cut | wc -l) TEST=$((NUMROWS / 10 * 2 )) DEV=$((NUMROWS / 10 * 4 )) TRAIN=$((NUMROWS - DEV )) -head -n $TEST data.shuf > data.test -head -n $DEV data.shuf | tail -n $TEST > data.dev -head -n $NUMROWS data.shuf | tail -n $TRAIN > data.train +head -n $TEST data.shuf.cut > data.test +head -n $DEV data.shuf.cut | tail -n $TEST > data.dev +head -n $NUMROWS data.shuf.cut | tail -n $TRAIN > data.train + +rm data.shuf.cut echo "Test rows ${TEST}" echo "Dev rows ${TEST}" echo "Train rows ${TRAIN}" echo "All number of rows ${NUMROWS}" -echo $1 \ No newline at end of file +