ium_444380/download_data.sh

10 lines
348 B
Bash
Raw Normal View History

#!/bin/bash
# Fetch the AnalyzeBoston/crimes-in-boston dataset from Kaggle, unpack it in
# the current directory, and re-encode crime.csv from Windows-1252 to UTF-8.
#
# Usage:    ./download_data.sh
# Requires: kaggle (CLI), unzip, iconv
# Outputs:  crimes-in-boston.zip, the extracted archive contents, and
#           crime_conv.csv (UTF-8 copy of crime.csv)

# Abort on the first failing command, on use of an unset variable, and on a
# failure anywhere in a pipeline, so a failed download or extraction never
# feeds stale or missing files into the following steps.
set -euo pipefail

# --force: download even if a local copy of the archive already exists.
kaggle datasets download -d AnalyzeBoston/crimes-in-boston --force

# -o: overwrite previously extracted files without prompting.
unzip -o crimes-in-boston.zip

# The redirection truncates crime_conv.csv before iconv starts, so on failure
# remove the partial file instead of leaving something that looks like output.
if ! iconv -f "windows-1252" -t "UTF-8" crime.csv > crime_conv.csv; then
  rm -f -- crime_conv.csv
  printf 'error: failed to convert crime.csv to UTF-8\n' >&2
  exit 1
fi

# Disabled shuffle + test/dev/train split, kept for reference.
# NOTE(review): it reads $1 as a row count and operates on crime.csv rather
# than crime_conv.csv; re-enabling it needs an argument check because of
# `set -u` above. Confirm intent before uncommenting.
#shuf crime.csv | head -n $1 > crime.shuf
#head -n 30000 crime.shuf > crime.test
#head -n 60000 crime.shuf | tail -n 30000 > crime.dev
#tail -n +60001 crime.shuf > crime.train