ium_452639/prepare-ztm-data.sh

33 lines
620 B
Bash
Raw Normal View History

2023-03-20 23:02:03 +01:00
#!/usr/bin/env bash
# Prepare the ZTM data set:
#   1. build the `normalize` and `csv2tsv/csv2tsv` helpers with make,
#   2. download the inputs named in ztm-data.txt into data/,
#   3. extract the files listed in `keep` from every downloaded archive,
#   4. concatenate each kept file across archives and convert it to TSV,
#   5. run ./normalize over stop_times.tsv.
# Steps 3 and 4 are skipped for outputs that already exist, so the script can
# be re-run after an interruption.
set -xe -o pipefail

make normalize csv2tsv/csv2tsv

# Archive members that are extracted and later merged.
keep=(stops.txt trips.txt stop_times.txt)

mkdir -p data && cd data
# wget is driven by the contents of ../ztm-data.txt, 8 jobs at a time;
# --no-clobber leaves already-downloaded files alone.
parallel -j 8 -- wget --no-verbose --no-clobber <../ztm-data.txt

# Iterate NUL-delimited so archive names are never word-split or glob-expanded
# (the names keep everything up to the last '=', so they may well contain
# shell-special characters).
while IFS= read -r -d '' file; do
  # Directory name = text after the last '=' in the path, minus ".zip".
  dir="${file##*=}"
  dir="${dir%.zip}"
  if [[ ! -d "$dir" ]]; then
    mkdir "$dir"
    # The directory doubles as the "already extracted" marker, so it must not
    # survive a failed extraction or the archive would be skipped forever.
    if ! unzip "$file" -d "$dir" "${keep[@]}"; then
      rm -rf -- "${dir:?}"
      exit 1
    fi
  fi
done < <(find . -name 'index*.zip' -print0)
cd ..

for k in "${keep[@]}"; do
  csv="${k%.txt}.csv"
  tsv="${k%.txt}.tsv"
  if [[ ! -f "$tsv" ]]; then
    # Collect every extracted copy of this file without word splitting.
    sources=()
    while IFS= read -r -d '' path; do
      sources+=("$path")
    done < <(find data -name "$k" -print0)
    # With no operands cat would read stdin instead; fail loudly.
    if ((${#sources[@]} == 0)); then
      printf 'no %s found under data/\n' "$k" >&2
      exit 1
    fi
    cat -- "${sources[@]}" >"$csv"
    # Convert into a temporary file and rename on success, so a failed
    # conversion cannot leave a truncated .tsv that later runs would trust.
    csv2tsv/csv2tsv <"$csv" >"$tsv.tmp"
    mv -- "$tsv.tmp" "$tsv"
  fi
done

./normalize <stop_times.tsv >stop_times.normalized.tsv