diff --git a/Jenkinsfile b/Jenkinsfile index a019bd3..d1dbf02 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -2,7 +2,7 @@ pipeline { agent { dockerfile { filename 'Dockerfile' - args '-u root' + args '-u root -v $HOME:/app' } } @@ -24,17 +24,16 @@ pipeline { stage('Run create-dataset script') { steps { withEnv (["KAGGLE_USERNAME=${params.KAGGLE_USERNAME}", "KAGGLE_KEY=${params.KAGGLE_KEY}"]) { - sh 'mkdir /.kaggle' - sh 'echo "{\"username\":\"$KAGGLE_USERNAME\",\"key\":\"$KAGGLE_KEY\"}" > /.kaggle/kaggle.json' - sh 'chmod 600 /.kaggle/kaggle.json' - sh 'chmod +x create-dataset.py' - sh 'python3 ./create-dataset.py' + dir ('/app') { + sh 'chmod +x create-dataset.py' + sh 'python3 ./create-dataset.py' + } } } } stage('Archive Artifacts') { steps { - archiveArtifacts artifacts: '/data/*', onlyIfSuccessful: true + archiveArtifacts artifacts: '/app/data/*', onlyIfSuccessful: true } } } diff --git a/create-dataset.py b/create-dataset.py index a09e03c..85fdcef 100644 --- a/create-dataset.py +++ b/create-dataset.py @@ -70,11 +70,11 @@ def save_undersample_data( y_train_undersample, y_test_undersample, ): - undersample_data.to_csv("/data/undersample_data.csv", index=False) - X_train_undersample.to_csv("/data/X_train_undersample.csv", index=False) - X_test_undersample.to_csv("/data/X_test_undersample.csv", index=False) - y_train_undersample.to_csv("/data/y_train_undersample.csv", index=False) - y_test_undersample.to_csv("/data/y_test_undersample.csv", index=False) + undersample_data.to_csv("data/undersample_data.csv", index=False) + X_train_undersample.to_csv("data/X_train_undersample.csv", index=False) + X_test_undersample.to_csv("data/X_test_undersample.csv", index=False) + y_train_undersample.to_csv("data/y_train_undersample.csv", index=False) + y_test_undersample.to_csv("data/y_test_undersample.csv", index=False) def split_whole_data(df): @@ -88,11 +88,11 @@ def split_whole_data(df): def save_whole_data(df, X_train, X_test, y_train, y_test): - 
df.to_csv("/data/creditcard.csv", index=False) - X_train.to_csv("/data/X_train.csv", index=False) - X_test.to_csv("/data/X_test.csv", index=False) - y_train.to_csv("/data/y_train.csv", index=False) - y_test.to_csv("/data/y_test.csv", index=False) + df.to_csv("data/creditcard.csv", index=False) + X_train.to_csv("data/X_train.csv", index=False) + X_test.to_csv("data/X_test.csv", index=False) + y_train.to_csv("data/y_train.csv", index=False) + y_test.to_csv("data/y_test.csv", index=False) def main():