ium_464863/Jenkinsfile

pipeline {
    agent any

    parameters {
        password (
            name: 'KAGGLE_USERNAME',
            defaultValue: '',
            description: 'Kaggle username'
        )
        password (
            name: 'KAGGLE_KEY',
            defaultValue: '',
            description: 'Kaggle API key'
        )
        string (
            name: 'CUTOFF',
            defaultValue: '500',
            description: 'Get only the first CUTOFF rows of the dataset'
        )
    }

    stages {
        stage('Clone repository') {
            steps {
                checkout scm
            }
        }

        stage('Download dataset') {
            steps {
                withEnv(["KAGGLE_USERNAME=${params.KAGGLE_USERNAME}", "KAGGLE_KEY=${params.KAGGLE_KEY}"]) {
                    sh "kaggle datasets download -d uciml/breast-cancer-wisconsin-data"
                    sh "unzip -o breast-cancer-wisconsin-data.zip"
                    sh "mkdir -p datasets"
                    sh "mv data.csv datasets/data.csv"
                }
            }
        }

        stage('Preprocess data') {
            agent {
                dockerfile {
                    filename 'Dockerfile'
                    reuseNode true
                }
            }

            steps {
                sh "chmod +x ./download_dataset.py"
                sh "python3 ./download_dataset.py ${params.CUTOFF}"
                archiveArtifacts artifacts: 'datasets/*', onlyIfSuccessful: true

                build job: 's464863-training/main', wait: false
            }
        }
    }
}