From 2400ef5b8949d3dcfc8b40bc9030daf264a910b2 Mon Sep 17 00:00:00 2001
From: Karolina Oparczyk
Date: Wed, 14 Apr 2021 20:25:53 +0200
Subject: [PATCH] Docker image

---
Review notes (text between "---" and the first "diff --git" line is not
applied by git):
 - Dockerfile: base tag pinned, apt steps merged into one layer with index
   cleanup, pip run with --no-cache-dir, ENV written in key=value form,
   trailing newline added.
 - The blob "index" line of the new Dockerfile is left out because the file
   content changed; git does not need it to apply a new-file hunk.
 - get_data.sh hunk: the leading whitespace of the context lines could not be
   recovered and is assumed to be four spaces - confirm against the file.

 Dockerfile  | 33 +++++++++++++++++++++++++++++++++
 get_data.sh |  2 +-
 2 files changed, 34 insertions(+), 1 deletion(-)
 create mode 100644 Dockerfile

diff --git a/Dockerfile b/Dockerfile
new file mode 100644
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,33 @@
+# Image with Python 3, pandas and the Kaggle CLI, used to run get_data.sh and main.py.
+
+# Pinned release instead of the moving "latest" tag, so rebuilds are reproducible.
+# NOTE(review): 20.04 assumed to be what "latest" resolved to when this was written - confirm.
+FROM ubuntu:20.04
+
+# Index refresh and install share one layer, so a cached index is never paired
+# with a changed package list; the index is deleted in the same layer.
+# ca-certificates is listed explicitly because recommended packages are skipped
+# and the pip / Kaggle downloads go over HTTPS.
+RUN apt-get update \
+    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
+        ca-certificates \
+        python3 \
+        python3-pip \
+        unzip \
+    && rm -rf /var/lib/apt/lists/*
+
+# --no-cache-dir keeps pip's download cache out of the image layer.
+RUN pip3 install --no-cache-dir kaggle pandas
+
+# Scripts are copied to the image root, which is the default working directory.
+COPY get_data.sh main.py /
+
+# KAGGLE_USERNAME / KAGGLE_KEY are the environment variables the Kaggle CLI
+# reads its credentials from.
+ENV KAGGLE_USERNAME=karopa
+
+# NOTE(review): a build argument copied into ENV is stored in the image metadata
+# and readable by anyone who can pull the image. Prefer passing KAGGLE_KEY at
+# run time (docker run -e KAGGLE_KEY=...) over --build-arg key=...
+ARG key
+ENV KAGGLE_KEY=${key}
diff --git a/get_data.sh b/get_data.sh
index 8ab956d..53d0b62 100644
--- a/get_data.sh
+++ b/get_data.sh
@@ -16,5 +16,5 @@ if kaggle datasets download -d sgonkaggle/youtube-trend-with-subscriber && unzip
     wc -l "data_dev"
     echo "Train dataset"
     wc -l "data_train"
-    python main.py USvideos_modified.csv
+    python3 main.py USvideos_modified.csv
 fi
\ No newline at end of file