diff --git a/download_dataset.sh b/download_dataset.sh
index f9e0abb..a653825 100644
--- a/download_dataset.sh
+++ b/download_dataset.sh
@@ -2,6 +2,6 @@
 kaggle datasets download -d sohier/crime-in-baltimore
 unzip crime-in-baltimore.zip
 
-head -n 8000 BPD_Part_1_Victim_Based_Crime_Data.csv > baltimore_train.csv
+head -n 10000 BPD_Part_1_Victim_Based_Crime_Data.csv > baltimore_train.csv
 tail -n 2000 BPD_Part_1_Victim_Based_Crime_Data.csv > baltimore_test.csv
 head -n 2000 baltimore_train.csv > baltimore_dev.csv