#!/bin/bash
#
# Downloads the country_vaccinations.csv dataset, trims it, shuffles the
# remaining lines and splits them into test / validation / train files.
#
# Environment:
#   CUTOFF      Number of leading lines to skip before shuffling
#               (default: 0, i.e. nothing is skipped).
#   SPLIT_SIZE  Number of lines written to each of test.csv and
#               validation.csv (default: 1468).
#
# Files written to the current directory:
#   country_vaccinations.csv  the download, left unmodified
#   vaccines.csv.shuf         trimmed and shuffled lines
#   test.csv                  shuffled lines 1 .. SPLIT_SIZE
#   validation.csv            shuffled lines SPLIT_SIZE+1 .. 2*SPLIT_SIZE
#   train.csv                 every remaining shuffled line
#
# NOTE(review): if the CSV starts with a header row it is shuffled together
# with the data unless CUTOFF >= 1 -- confirm the intended CUTOFF value.

set -euo pipefail

readonly DATA_URL='https://git.wmi.amu.edu.pl/s434804/ium_434804/raw/branch/master/country_vaccinations.csv'
readonly RAW_FILE='country_vaccinations.csv'
readonly SHUFFLED_FILE='vaccines.csv.shuf'

# Prints a message to stderr and aborts the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

cutoff="${CUTOFF:-0}"
split_size="${SPLIT_SIZE:-1468}"

[[ "${cutoff}" =~ ^[0-9]+$ ]] \
  || die "CUTOFF must be a non-negative integer, got '${cutoff}'"
[[ "${split_size}" =~ ^[0-9]+$ ]] \
  || die "SPLIT_SIZE must be a non-negative integer, got '${split_size}'"

# Force base 10 so values with leading zeros are not parsed as octal.
first_kept_line=$(( 10#${cutoff} + 1 ))
split_size=$(( 10#${split_size} ))
validation_first=$(( split_size + 1 ))
validation_last=$(( 2 * split_size ))
train_first=$(( validation_last + 1 ))

echo "pobieram dane"
# --fail: abort on an HTTP error instead of saving the error page as the CSV.
curl --fail --location --output "${RAW_FILE}" "${DATA_URL}"

echo "CUTOFF danych"
# Drop the last line (negative count is a GNU head extension), skip the first
# CUTOFF lines, then shuffle. The data is piped straight into shuf; the
# downloaded file is only read, never rewritten.
head -n -1 -- "${RAW_FILE}" \
  | tail -n "+${first_kept_line}" \
  | shuf > "${SHUFFLED_FILE}"

echo "Wielkość zbioru"
wc -l -- "${SHUFFLED_FILE}"

# Three disjoint, consecutive slices of the shuffled file.
head -n "${split_size}" -- "${SHUFFLED_FILE}" > test.csv

# An explicit line range keeps validation disjoint from test even when the
# input has fewer than 2*SPLIT_SIZE lines.
awk -v first="${validation_first}" -v last="${validation_last}" \
  'NR >= first && NR <= last' "${SHUFFLED_FILE}" > validation.csv

# Start one line after the validation slice so no line lands in both sets.
tail -n "+${train_first}" -- "${SHUFFLED_FILE}" > train.csv

wc -l -- *.csv