r
This commit is contained in:
parent
9700a1349d
commit
d83a35ed0e
@ -5,7 +5,7 @@ import numpy as np
|
||||
|
||||
# kaggle.api.authenticate()
|
||||
# kaggle.api.dataset_download_files('shivamb/real-or-fake-fake-jobposting-prediction', path='fake_job_postings.csv', unzip=True)
|
||||
data=pd.read_csv('fake_job_postings.csv')
|
||||
data=pd.read_csv('/data/fake_job_postings.csv')
|
||||
data = data.replace(np.nan, '', regex=True)
|
||||
|
||||
print("="*20)
|
||||
|
@ -3,6 +3,7 @@ echo "Download data from kaggle"
|
||||
echo $KAGGLE_USERNAME
|
||||
kaggle datasets download -d shivamb/real-or-fake-fake-jobposting-prediction
|
||||
unzip -o real-or-fake-fake-jobposting-prediction.zip
|
||||
# Copy the extracted dataset to /data, the path the Python script reads from.
# The file in the working directory is fake_job_postings.csv (single extension),
# the same name used by the head/tail commands in this script.
cp fake_job_postings.csv /data/fake_job_postings.csv
|
||||
echo "Save column titles"
|
||||
head -n 1 fake_job_postings.csv > column_titles.csv
|
||||
tail -n +2 fake_job_postings.csv > data_not_shuf.csv
|
||||
|
Loading…
Reference in New Issue
Block a user