diff --git a/Jenkinsfile b/Jenkinsfile index 9040aea..5fd32e6 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -4,7 +4,7 @@ pipeline { parameters { string(name: 'KAGGLE_USERNAME', defaultValue: 'gulczas', description: 'Kaggle username') password(name: 'KAGGLE_KEY', defaultValue: '', description: 'Kaggle API key') - string(name: 'CUTOFF', defaultValue: '10', description: 'Number of rows to cut') + string(name: 'CUTOFF', defaultValue: '90', description: 'Number of rows to cut') } stages { diff --git a/download_dataset.sh b/download_dataset.sh index 02c1c7d..dc9259b 100644 --- a/download_dataset.sh +++ b/download_dataset.sh @@ -9,7 +9,7 @@ unzip -o spotify-dataset.zip echo "------------------ Shufle ------------------" shuf Spotify_Dataset.csv -o shuffled_spotify.csv -echo "------------------ Cut off top: $1 rows ------------------" +echo "------------------ Cut off to top $1 rows ------------------" head -n $1 shuffled_spotify.csv > cutoff_spotify.csv echo "------------------ Split ------------------"