Added a script that downloads the data and splits it into test, dev, and train sets

This commit is contained in:
s444380 2022-03-27 11:29:22 +02:00
parent 22a0d94899
commit 98939fc551

8
download_data.sh Executable file
View File

@ -0,0 +1,8 @@
#!/bin/bash
# Download the "Crimes in Boston" dataset from Kaggle and split it into
# test / dev / train sets.
#
# Requires: the `kaggle` CLI (with API credentials configured), unzip, and
# GNU coreutils (shuf, head, tail).
#
# Outputs (written to the current directory):
#   crime.header - the column-header line of crime.csv
#   crime.shuf   - all data rows of crime.csv in random order (no header)
#   crime.test   - shuffled rows 1-30000
#   crime.dev    - shuffled rows 30001-60000
#   crime.train  - shuffled rows 60001 onwards

# Abort on the first failing step so that a failed download or extraction
# never leads to splitting a stale or missing crime.csv.
set -euo pipefail

kaggle datasets download -d AnalyzeBoston/crimes-in-boston

# -o: overwrite already-extracted files without prompting, so that re-running
# the script does not block waiting for input.
unzip -o crimes-in-boston.zip

# Keep the header line out of the shuffle; otherwise it would land at a random
# position inside one of the splits and be treated as a data row. It is saved
# separately so consumers can still recover the column names.
head -n 1 crime.csv > crime.header
tail -n +2 crime.csv | shuf > crime.shuf

# Split by position in the shuffled file: first 30000 rows -> test,
# next 30000 rows -> dev, everything after row 60000 -> train.
head -n 30000 crime.shuf > crime.test
head -n 60000 crime.shuf | tail -n 30000 > crime.dev
tail -n +60001 crime.shuf > crime.train