ium_478831/evaluate_data.py
JulianZablonski ec2a3d1c51 DVC
2022-06-05 14:57:08 +02:00

11 lines
476 B
Python

import pandas as pd
# Build the evaluation dataset from the raw adult-income CSV: add two 0/1
# indicator columns, drop rows whose workclass is '?', and write the result
# to two output files.
df = pd.read_csv('adult-income-dataset.csv')

# Vectorised comparisons yield the same 0/1 values as a row-wise ``apply``
# with a lambda, without a Python-level call per row.
# 1 when income is exactly '<=50K', otherwise 0.
df['income_if_<=50k'] = (df['income'] == '<=50K').astype(int)
# 1 when gender is exactly 'Male', otherwise 0.
df['if_male'] = (df['gender'] == 'Male').astype(int)

# Drop rows whose workclass is the literal '?' (presumably the dataset's
# marker for an unknown value -- TODO confirm), then renumber the index
# from 0 so it is contiguous again after filtering.
df = df[df['workclass'] != '?'].reset_index(drop=True)

# The same frame is written to both files, without the index column.
# NOTE(review): the second copy looks like the DVC-tracked output -- confirm.
df.to_csv('evaluate_data.csv', index=False)
df.to_csv('evaluate_data_dvc.csv', index=False)