diff --git a/download_dataset.sh b/download_dataset.sh index 6cccb15..a38e13e 100644 --- a/download_dataset.sh +++ b/download_dataset.sh @@ -22,6 +22,7 @@ fi head -n $(expr $data_size / 10 \* 8) data.csv > train.csv tail -n $(expr $data_size / 10 \* 2) data.csv > dev.csv.tmp +# Get number of rows in dev.csv.tmp dev_size=$(wc -l < dev.csv.tmp) head -n $(expr $dev_size / 10 \* 5) dev.csv.tmp > dev.csv