Update Jenkinsfile, bash script ver 1.6
This commit is contained in:
parent
0267eaa861
commit
acdb4cb429
2
Jenkinsfile
vendored
2
Jenkinsfile
vendored
@ -13,7 +13,7 @@ pipeline {
|
|||||||
name: 'KAGGLE_KEY'
|
name: 'KAGGLE_KEY'
|
||||||
)
|
)
|
||||||
string(
|
string(
|
||||||
defaultValue: '10',
|
defaultValue: '10841',
|
||||||
description: 'cutoff parameter',
|
description: 'cutoff parameter',
|
||||||
name: 'CUTOFF'
|
name: 'CUTOFF'
|
||||||
)
|
)
|
||||||
|
26
data_prep.sh
26
data_prep.sh
@ -1,12 +1,24 @@
|
|||||||
#!/bin/bash
|
#!/bin/bash
|
||||||
|
|
||||||
kaggle datasets download -d lava18/google-play-store-apps
|
#kaggle datasets download -d lava18/google-play-store-apps
|
||||||
unzip -o google-play-store-apps.zip
|
unzip -o google-play-store-apps.zip
|
||||||
sed -i '1d' googleplaystore.csv
|
sed -i '1d' googleplaystore.csv
|
||||||
shuf googleplaystore.csv > apps_shuf.csv
|
shuf googleplaystore.csv > apps_shuf_.csv
|
||||||
|
head -n $CUTOFF apps_shuf_.csv > apps_shuf.csv
|
||||||
|
|
||||||
|
total=$(wc -l apps_shuf.csv | awk '{print $1}')
|
||||||
|
test_set=$(( (total*60+50) / 100 ))
|
||||||
|
train_val_set=$(( (total*20+50) / 100 ))
|
||||||
|
|
||||||
#cp apps_shuf.csv apps_shuf_copy.csv
|
#cp apps_shuf.csv apps_shuf_copy.csv
|
||||||
head -n 6505 apps_shuf.csv > apps_train.csv
|
|
||||||
sed -i '1,6505d' apps_shuf.csv
|
head -n $test_set apps_shuf.csv > apps_train.csv
|
||||||
head -n 2168 apps_shuf.csv > apps_test.csv
|
lines="1,$test_set"
|
||||||
sed -i '1,2168d' apps_shuf.csv
|
sed -i "$lines"'d' apps_shuf.csv
|
||||||
head -n 2168 apps_shuf.csv > apps_validate.csv
|
head -n $train_val_set apps_shuf.csv > apps_test.csv
|
||||||
|
lines="1,$train_val_set"
|
||||||
|
sed -i "$lines"'d' apps_shuf.csv
|
||||||
|
head -n $train_val_set apps_shuf.csv > apps_validate.csv
|
||||||
|
wc -l apps_train.csv
|
||||||
|
wc -l apps_test.csv
|
||||||
|
wc -l apps_validate.csv
|
Loading…
Reference in New Issue
Block a user