ium_z444510/create-dataset.sh
piotrwrzodak 3a16591ae5 revert
2023-04-21 00:07:49 +02:00

15 lines
625 B
Bash

#!/bin/bash
#
# Download the "airbnb-prices-in-european-cities" Kaggle dataset, unpack it
# into data/, and split a shuffled prefix of data/barcelona_weekends.csv into
# test / dev / train files.
#
# Environment:
#   KAGGLE_USERNAME, KAGGLE_KEY  exported so the kaggle child process sees them
#   CUTOFF                       number of leading lines of the source CSV to
#                                use (passed to `head -n`); required
#
# Outputs (lines refer to the shuffled prefix):
#   data/barcelona_weekends.test.csv   lines 1-25
#   data/barcelona_weekends.dev.csv    lines 26-50
#   data/barcelona_weekends.train.csv  lines 51 to the end

# Abort on the first failing command, unset variable, or failing pipeline
# stage, so a failed download/unzip cannot silently produce empty splits.
set -euo pipefail

# Fail early with a clear message instead of letting `head -n` misparse the
# file name as the line count when CUTOFF is missing.
: "${CUTOFF:?CUTOFF must be set to the number of lines to take from the source CSV}"

# `:-` keeps the original behaviour (export whatever is set, possibly empty)
# while staying compatible with `set -u`.
export KAGGLE_USERNAME="${KAGGLE_USERNAME:-}"
export KAGGLE_KEY="${KAGGLE_KEY:-}"

readonly DATASET_OWNER="thedevastator"
readonly DATASET_NAME="airbnb-prices-in-european-cities"
readonly ARCHIVE="${DATASET_NAME}.zip"
readonly DATA_DIR="data"
readonly PREFIX="${DATA_DIR}/barcelona_weekends"

kaggle datasets download -d "${DATASET_OWNER}/${DATASET_NAME}"

# -o: overwrite existing files without prompting, so re-runs do not block on
# an interactive question.
unzip -o "$ARCHIVE" -d "$DATA_DIR"
rm -- "$ARCHIVE"

# Take the first CUTOFF lines and shuffle them.
# NOTE(review): `head` counts from the very first line of the file, so if the
# CSV begins with a header row, that row is shuffled together with the data
# and lands in an arbitrary split -- confirm whether downstream expects this.
head -n "$CUTOFF" "${PREFIX}.csv" | shuf > "${PREFIX}.shuf.csv"

# Partition the shuffled file: 25 lines test, next 25 lines dev, rest train.
head -n 25 "${PREFIX}.shuf.csv" > "${PREFIX}.test.csv"
head -n 50 "${PREFIX}.shuf.csv" | tail -n 25 > "${PREFIX}.dev.csv"
tail -n +51 "${PREFIX}.shuf.csv" > "${PREFIX}.train.csv"

# The intermediate shuffled file is no longer needed.
rm -- "${PREFIX}.shuf.csv"