pipeline { agent { dockerfile { filename 'Dockerfile' args '-u root' } } parameters { password ( name: 'KAGGLE_USERNAME', defaultValue: '', description: 'Kaggle username' ) password ( name: 'KAGGLE_KEY', defaultValue: '', description: 'Kaggle API key' ) string ( name: 'CUTOFF', defaultValue: '500', description: 'Get only the first CUTOFF rows of the dataset' ) } stages { stage('Clone repository') { steps { checkout scm } } stage('Download dataset') { steps { withEnv(["KAGGLE_USERNAME=${params.KAGGLE_USERNAME}", "KAGGLE_KEY=${params.KAGGLE_KEY}", "CUTOFF=${params.CUTOFF}"]) { sh "KAGGLE_USERNAME=${params.KAGGLE_USERNAME} KAGGLE_KEY=${params.KAGGLE_KEY} kaggle datasets download -d uciml/breast-cancer-wisconsin-data" sh "unzip -o breast-cancer-wisconsin-data.zip" sh "mkdir datasets" sh "mv data.csv datasets/data.csv" sh "sudo chmod +x ./download_dataset.py" sh "python3 ./download_dataset.py $CUTOFF" archiveArtifacts artifacts: './datasets/data.csv,./datasets/train.csv,./datasets/dev.csv,./datasets/test.csv', onlyIfSuccessful: true } } } } }