2022-04-03 17:26:46 +02:00
|
|
|
# Base image. An untagged reference resolves to `ubuntu:latest`, which moves to
# a new release over time and makes builds non-reproducible, so the release is
# pinned explicitly.
# NOTE(review): 22.04 is chosen because newer Ubuntu releases mark the system
# Python as externally managed (PEP 668), which makes a plain system-wide
# `pip3 install` fail; adjust the tag if another release is required.
FROM ubuntu:22.04
|
|
|
|
|
|
|
|
# Build-time argument, supplied with `--build-arg KAGGLE_USERNAME=...`;
# presumably the Kaggle account name — confirm against the build job.
# NOTE(review): build-arg values are visible in `docker history`; if this is a
# credential, a BuildKit secret mount would keep it out of the image metadata.
ARG KAGGLE_USERNAME
|
|
|
|
# Build-time argument, supplied with `--build-arg KAGGLE_KEY=...`;
# presumably the Kaggle API key — confirm against the build job.
# NOTE(review): build-arg values are visible in `docker history`; if this is a
# credential, a BuildKit secret mount would keep it out of the image metadata.
ARG KAGGLE_KEY
|
|
|
|
# Build-time argument CUTOFF. It is declared without a default, so it has no
# value unless one is passed with `--build-arg CUTOFF=...`.
ARG CUTOFF
|
|
|
|
# Persist CUTOFF into the image environment so it is available at runtime,
# falling back to 260000 when the CUTOFF build argument was not supplied.
ENV CUTOFF=${CUTOFF:-260000}
|
2022-04-03 18:26:37 +02:00
|
|
|
# Sets IS_DOCKER=True in the image environment.
# NOTE(review): presumably read by the copied scripts to detect that they run
# inside the container — verify against the scripts.
ENV IS_DOCKER=True
|
2022-04-03 17:26:46 +02:00
|
|
|
|
|
|
|
# Use /app as the working directory for the following instructions; the
# relative `./` destinations of the COPY steps below resolve to it.
WORKDIR /app
|
|
|
|
# Shell helpers: data download and statistics scripts, copied into the
# current working directory of the image.
COPY download_data.sh calc_stats.sh ./
|
|
|
|
# Python scripts for cleaning/splitting the data and computing statistics,
# copied into the current working directory of the image.
COPY clean_and_split_data.py calc_stats.py ./
|
2022-05-15 20:15:27 +02:00
|
|
|
# Model training scripts (plain and MLflow variants), copied into the
# current working directory of the image.
COPY train_model.py train_model_mlflow.py ./
|
2022-05-03 20:52:59 +02:00
|
|
|
# Evaluation script, copied into the current working directory of the image.
COPY evaluate.py ./
|
2022-04-03 17:26:46 +02:00
|
|
|
|
2022-06-05 15:59:11 +02:00
|
|
|
# Install OS-level tooling in a single layer: pip for the Python packages,
# unzip, and the SSH client utilities (sshpass, openssh-client). The apt
# package lists are removed in the same layer so they do not stay in the image.
# NOTE(review): `--no-install-recommends` would shrink the layer further, but
# may drop packages the pip step relies on — verify before adding it.
RUN apt-get update \
    && apt-get install -y \
        openssh-client \
        python3-pip \
        sshpass \
        unzip \
    && rm -rf /var/lib/apt/lists/*
|
2022-04-03 17:26:46 +02:00
|
|
|
|
|
|
|
# Add root's user-level pip bin directory to PATH.
# Each RUN step executes in its own shell, so an `export` inside RUN is lost
# as soon as that step ends; ENV makes the change apply to every later build
# step and to containers started from the image.
ENV PATH="${PATH}:/root/.local/bin"
|
|
|
|
|
2022-06-05 15:59:11 +02:00
|
|
|
# Install the Python dependencies system-wide.
# `--no-cache-dir` keeps pip's download cache out of the image layer.
# `dvc[ssh]` already installs dvc itself, so the separate `dvc` entry is folded
# into it; the resulting package set is unchanged.
# NOTE(review): versions are unpinned, so the resolved set can differ between
# builds — consider pinning via a requirements file.
RUN pip3 install --no-cache-dir \
        'dvc[ssh]' \
        kaggle \
        keras \
        matplotlib \
        mlflow \
        numpy \
        pandas \
        paramiko \
        sacred \
        scikit-learn \
        tensorflow
|
2022-04-03 17:26:46 +02:00
|
|
|
|
2022-04-10 18:08:07 +02:00
|
|
|
# Create /.kaggle at the filesystem root and make it writable for "other"
# users, so a process not running as the directory owner can write into it.
RUN mkdir /.kaggle \
    && chmod o+w /.kaggle
|
2022-06-05 15:59:11 +02:00
|
|
|
|
|
|
|
# Create a system account named "jenkins" with the fixed UID 111.
# NOTE(review): presumably the UID matches the Jenkins agent on the host so
# file ownership lines up — confirm. No USER instruction is visible in this
# section, so the account is only created here, not switched to.
RUN useradd --system --uid 111 jenkins
|