ium_z444510/create-dataset.sh

15 lines
625 B
Bash
Raw Permalink Normal View History

2023-04-20 23:03:49 +02:00
#!/bin/bash
2023-04-20 22:27:59 +02:00
2023-04-20 23:15:39 +02:00
# Download the Kaggle "airbnb-prices-in-european-cities" dataset, unpack it
# into data/, and write a shuffled copy of the first CUTOFF lines of
# data/barcelona_weekends.csv to data/barcelona_weekends.shuf.csv.
#
# Environment:
#   KAGGLE_USERNAME, KAGGLE_KEY - exported for the kaggle CLI.
#   CUTOFF                      - line count handed to `head -n` (required).

# Mark the credentials for export to child processes. Unlike
# `export VAR=$VAR`, this does not define an unset variable as an empty string.
export KAGGLE_USERNAME KAGGLE_KEY

# Fail fast, before downloading anything, when CUTOFF is missing or malformed:
# an empty value would make `head -n` consume the file name as its line count.
# A leading '-' is accepted because head itself accepts it.
if ! [[ "${CUTOFF:-}" =~ ^-?[0-9]+$ ]]; then
  printf 'create-dataset: CUTOFF must be an integer, got "%s"\n' "${CUTOFF:-}" >&2
  exit 1
fi

dataset_zip=airbnb-prices-in-european-cities.zip
barcelona_csv=data/barcelona_weekends.csv

kaggle datasets download -d thedevastator/airbnb-prices-in-european-cities || {
  printf 'create-dataset: kaggle download failed\n' >&2
  exit 1
}

# -o overwrites existing files without prompting, so a re-run over an already
# populated data/ directory does not block waiting for input.
unzip -o "$dataset_zip" -d data
unzip_status=$?
# unzip reports 1 for warnings with extraction still completed; anything above
# that is treated as a real failure. The archive is kept in that case.
if ((unzip_status > 1)); then
  printf 'create-dataset: unzip failed with status %d\n' "$unzip_status" >&2
  exit 1
fi
rm -- "$dataset_zip"

if [[ ! -r "$barcelona_csv" ]]; then
  printf 'create-dataset: %s not found after extraction\n' "$barcelona_csv" >&2
  exit 1
fi

# NOTE(review): line 1 of the CSV (presumably a header row - confirm) is among
# the lines being shuffled, so it can land anywhere in the output.
head -n "$CUTOFF" "$barcelona_csv" | shuf > data/barcelona_weekends.shuf.csv || exit 1
2023-04-21 00:07:49 +02:00
# Split the shuffled file by line position into three disjoint parts:
#   lines 1-25  -> test
#   lines 26-50 -> dev
#   lines 51+   -> train
# Absolute line ranges are used for every part. Taking the dev set as "the
# last 25 of the first 50 lines" overlaps the test set whenever the input has
# fewer than 50 lines.
shuffled_csv=data/barcelona_weekends.shuf.csv
sed -n '1,25p' "$shuffled_csv" > data/barcelona_weekends.test.csv
sed -n '26,50p' "$shuffled_csv" > data/barcelona_weekends.dev.csv
sed -n '51,$p' "$shuffled_csv" > data/barcelona_weekends.train.csv
2023-04-20 23:15:39 +02:00
# Delete the intermediate shuffled file.
shuffled_tmp="data/barcelona_weekends.shuf.csv"
rm -- "$shuffled_tmp"