Pass the CUTOFF build parameter to download_dataset.sh as its second argument
(the script truncates data.csv with `head -n "$2"`) and drop the debug echo of "$2".

diff --git a/Jenkinsfile b/Jenkinsfile
index 640d763..85bc5c0 100644
--- a/Jenkinsfile
+++ b/Jenkinsfile
@@ -30,9 +30,9 @@ pipeline {
         }
         stage('Download dataset') {
             steps {
-                withEnv(["USERNAME=${params.USERNAME}", "API_KEY=${params.API_KEY}", "DATA_TRAIN_RATIO=${params.DATA_TRAIN_RATIO}"]) {
+                withEnv(["USERNAME=${params.USERNAME}", "API_KEY=${params.API_KEY}", "DATA_TRAIN_RATIO=${params.DATA_TRAIN_RATIO}", "CUTOFF=${params.CUTOFF}"]) {
                     sh "chmod +x download_dataset.sh"
-                    sh "./download_dataset.sh $DATA_TRAIN_RATIO"
+                    sh "./download_dataset.sh $DATA_TRAIN_RATIO $CUTOFF"
                     archiveArtifacts artifacts: 'data.csv,train.csv,test.csv', onlyIfSuccessful: true
                 }
             }
diff --git a/download_dataset.sh b/download_dataset.sh
index 71bad14..2ffb017 100644
--- a/download_dataset.sh
+++ b/download_dataset.sh
@@ -5,7 +5,6 @@ kaggle datasets download -d nikhil7280/student-performance-multiple-linear-regre
 # change dataset name to data.csv
 mv Student_Performance.csv data.csv
 
-echo "$2"
 # cut off rows
 head -n "$2" data.csv > data.csv.tmp && mv data.csv.tmp data.csv
 