Added download script
This commit is contained in:
parent
d83fc31434
commit
0cda5fe099
48
Jenkinsfile
vendored
48
Jenkinsfile
vendored
@ -1,27 +1,23 @@
|
|||||||
node {
|
pipeline {
|
||||||
stage('Preparation') {
|
agent any
|
||||||
properties([
|
|
||||||
parameters([
|
stages {
|
||||||
string(
|
stage('Clone Repository') {
|
||||||
defaultValue: 'tomaszzitkiewicz',
|
steps {
|
||||||
description: 'Kaggle username',
|
git 'https://git.wmi.amu.edu.pl/s464953/ium_464953.git'
|
||||||
name: 'KAGGLE_USERNAME',
|
}
|
||||||
trim: false
|
}
|
||||||
),
|
stage('Run Script') {
|
||||||
password(
|
steps {
|
||||||
defaultValue: '',
|
script {
|
||||||
description: 'Kaggle token taken from kaggle.json file, as described in https://github.com/Kaggle/kaggle-api#api-credentials',
|
// Quote both expansions so an empty or whitespace-containing value still
// arrives as exactly one positional argument ($1 = username, $2 = key).
sh 'bash download_dataset.sh "$KAGGLE_USERNAME" "$KAGGLE_KEY"'
|
||||||
name: 'KAGGLE_KEY'
|
}
|
||||||
)
|
}
|
||||||
])
|
}
|
||||||
])
|
stage('Archive Artifacts') {
|
||||||
}
|
steps {
|
||||||
stage('Build') {
|
archiveArtifacts artifacts: 'artifacts/*', onlyIfSuccessful: true
|
||||||
// Run the maven build
|
}
|
||||||
withEnv(["KAGGLE_USERNAME=${params.KAGGLE_USERNAME}",
|
}
|
||||||
"KAGGLE_KEY=${params.KAGGLE_KEY}" ]) {
|
}
|
||||||
sh 'echo KAGGLE_USERNAME: $KAGGLE_USERNAME'
|
|
||||||
sh 'kaggle datasets list'
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
}
|
46
download_dataset.sh
Normal file
46
download_dataset.sh
Normal file
@ -0,0 +1,46 @@
|
|||||||
|
#!/bin/bash
#
# Download the Kaggle dataset brunoalercon123/top-200-spotify-songs-dataset,
# derive several CSV variants from it and collect them, together with a short
# text preview, in the artifacts/ directory.
#
# Usage: download_dataset.sh [KAGGLE_USERNAME] [KAGGLE_KEY]
#   $1  Kaggle username (falls back to the KAGGLE_USERNAME environment variable)
#   $2  Kaggle API key  (falls back to the KAGGLE_KEY environment variable)
#
# Outputs (all moved into artifacts/):
#   shuffled_spotify.csv   lines of Spotify-200-Songs.csv in random order
#   subset1.csv            first 100 lines of the shuffled file
#   subset2.csv            last 100 lines of the shuffled file
#   trimmed_spotify.csv    columns 1-3 of the shuffled file
#   processed_spotify.csv  columns 1,2,4,5,6 of the shuffled file
#   results.txt            first 10 lines of each of the files above

# Abort on the first failing command or unset variable so a failed install,
# download or unzip is reported instead of producing empty artifacts.
set -euo pipefail

pip install kaggle --upgrade

kaggle_username="${1:-${KAGGLE_USERNAME:-}}"
kaggle_key="${2:-${KAGGLE_KEY:-}}"

# Set the environment variables read by the kaggle CLI.
export KAGGLE_USERNAME="$kaggle_username"
export KAGGLE_KEY="$kaggle_key"

kaggle datasets download brunoalercon123/top-200-spotify-songs-dataset

# -o: overwrite without prompting, so a re-run in a reused workspace
# does not stop to ask for confirmation.
unzip -o top-200-spotify-songs-dataset.zip

# NOTE(review): shuf treats every line alike; if the CSV starts with a header
# row it is shuffled into the data as well -- confirm whether that is intended.
shuf Spotify-200-Songs.csv -o shuffled_spotify.csv

head -n 100 shuffled_spotify.csv > subset1.csv
tail -n 100 shuffled_spotify.csv > subset2.csv

# NOTE(review): cut splits on every comma, including commas inside quoted
# fields -- verify the dataset has none in the selected columns.
cut -d ',' -f 1,2,3 shuffled_spotify.csv > trimmed_spotify.csv
cut -d ',' -f 1,2,4,5,6 shuffled_spotify.csv > processed_spotify.csv

# Print a titled preview (first 10 lines) of a file, followed by a blank line.
#   $1  title line
#   $2  file to preview
preview() {
    echo "$1"
    head "$2"
    echo ""
}

{
    preview "Shuffled dataset:" shuffled_spotify.csv
    preview "Subset 1:" subset1.csv
    preview "Subset 2:" subset2.csv
    preview "Trimmed dataset:" trimmed_spotify.csv
    preview "Processed dataset:" processed_spotify.csv
} > results.txt

mkdir -p artifacts
mv shuffled_spotify.csv subset1.csv subset2.csv trimmed_spotify.csv processed_spotify.csv results.txt artifacts/
|
Loading…
Reference in New Issue
Block a user