dataset stats

This commit is contained in:
wojciechbatruszewicz 2023-06-26 19:18:24 +02:00
parent 178f324d58
commit c8c63d20dc
2 changed files with 43 additions and 0 deletions

34
JenkinsfileDatasetStats Normal file
View File

@ -0,0 +1,34 @@
// Pipeline that copies the artifacts of a selected 'x1-create-dataset' build
// into ./datasetStats and then runs datasetStats.py on them inside a Docker
// container.
pipeline {
    agent any
    parameters {
        // Selects which upstream build the artifacts are taken from;
        // defaults to the last successful one.
        buildSelector(
            name: 'BUILD_SELECTOR',
            defaultSelector: lastSuccessful(),
            description: 'A build to take the artifacts from'
        )
    }
    stages {
        stage('Copy artifacts') {
            steps {
                script {
                    // Artifacts land under ./datasetStats, not in the workspace root.
                    copyArtifacts(
                        projectName: 'x1-create-dataset',
                        selector: buildParameter('BUILD_SELECTOR'),
                        target: './datasetStats'
                    )
                }
            }
        }
        stage('Run sh file') {
            steps {
                script {
                    sh 'ls -l'
                    // NOTE(review): 'docker-image' looks like a placeholder image
                    // name - confirm it resolves to an image with python3 and pandas.
                    docker.image('docker-image').inside {
                        sh 'ls -l'
                        // datasetStats.py opens the CSV files by bare relative name,
                        // so it must run from the directory the artifacts were
                        // copied into. A plain shell `cd` is used so the working
                        // directory change happens inside the container shell itself.
                        // NOTE(review): assumes the upstream job archives the CSVs at
                        // the root of its artifact tree - confirm.
                        sh 'cd ./datasetStats && python3 ../datasetStats.py'
                    }
                }
            }
        }
    }
}

9
datasetStats.py Normal file
View File

@ -0,0 +1,9 @@
import pandas as pd
# Dataset splits summarised by this script, as (label, CSV path) pairs.
# Paths are relative to the current working directory.
DATASET_FILES = (
    ('train', 'gender_classification_train.csv'),
    ('test', 'gender_classification_test.csv'),
    ('val', 'gender_classification_val.csv'),
)


def describe_dataset(csv_path):
    """Load a CSV file and return its summary statistics.

    Args:
        csv_path: Path to the CSV file to read.

    Returns:
        The DataFrame produced by ``DataFrame.describe()`` for the file.

    Raises:
        FileNotFoundError: If ``csv_path`` does not exist.
    """
    return pd.read_csv(csv_path).describe()


def main():
    """Print summary statistics for every split listed in DATASET_FILES."""
    for split_name, csv_path in DATASET_FILES:
        print(f'=== {split_name}: {csv_path} ===')
        # A bare `.describe()` expression only echoes in an interactive
        # session; when run as a script the result must be printed explicitly.
        # to_string() avoids column truncation in the console output.
        print(describe_dataset(csv_path).to_string())


if __name__ == '__main__':
    main()