From e3d5fa89f139b57a8605e2183d1e4a06e2386cc7 Mon Sep 17 00:00:00 2001 From: Mateusz Date: Mon, 1 Apr 2024 17:09:39 +0200 Subject: [PATCH] Dockerfile --- Jenkinsfile | 2 +- create-dataset.py | 22 +++++++++++----------- 2 files changed, 12 insertions(+), 12 deletions(-) diff --git a/Jenkinsfile b/Jenkinsfile index 81562f1..8340e67 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -31,7 +31,7 @@ pipeline { } stage('Archive Artifacts') { steps { - archiveArtifacts artifacts: '/data/*', onlyIfSuccessful: true + archiveArtifacts artifacts: 'data/*', onlyIfSuccessful: true } } } diff --git a/create-dataset.py b/create-dataset.py index 97fef25..e4ebc8c 100644 --- a/create-dataset.py +++ b/create-dataset.py @@ -72,11 +72,11 @@ def save_undersample_data( y_train_undersample, y_test_undersample, ): - undersample_data.to_csv("/data/undersample_data.csv", index=False) - X_train_undersample.to_csv("/data/X_train_undersample.csv", index=False) - X_test_undersample.to_csv("/data/X_test_undersample.csv", index=False) - y_train_undersample.to_csv("/data/y_train_undersample.csv", index=False) - y_test_undersample.to_csv("/data/y_test_undersample.csv", index=False) + undersample_data.to_csv("data/undersample_data.csv", index=False) + X_train_undersample.to_csv("data/X_train_undersample.csv", index=False) + X_test_undersample.to_csv("data/X_test_undersample.csv", index=False) + y_train_undersample.to_csv("data/y_train_undersample.csv", index=False) + y_test_undersample.to_csv("data/y_test_undersample.csv", index=False) def split_whole_data(df): @@ -90,16 +90,16 @@ def split_whole_data(df): def save_whole_data(df, X_train, X_test, y_train, y_test): - df.to_csv("/data/creditcard.csv", index=False) - X_train.to_csv("/data/X_train.csv", index=False) - X_test.to_csv("/data/X_test.csv", index=False) - y_train.to_csv("/data/y_train.csv", index=False) - y_test.to_csv("/data/y_test.csv", index=False) + df.to_csv("data/creditcard.csv", index=False) + X_train.to_csv("data/X_train.csv", index=False) + X_test.to_csv("data/X_test.csv", index=False) + y_train.to_csv("data/y_train.csv", index=False) + y_test.to_csv("data/y_test.csv", index=False) def main(): download_kaggle_dataset() - os.makedirs("/data", exist_ok=True) + os.makedirs("data", exist_ok=True) df = load_data("creditcard.csv") df = normalize_data(df)