Import train_test_split by name in data_processing.py.

Adds `from sklearn.model_selection import train_test_split` and switches both
split calls from `sklearn.model_selection.train_test_split(...)` to the bare
`train_test_split(...)`; the arguments of both calls are unchanged.

NOTE(review): this patch was recovered from a copy whose line breaks had been
removed. The three blank context lines below were placed so the hunk matches
its header (10 old / 11 new lines); confirm their positions against the real
data_processing.py before applying.

diff --git a/data_processing.py b/data_processing.py
index f11e556..480b6c2 100644
--- a/data_processing.py
+++ b/data_processing.py
@@ -1,10 +1,11 @@
 import sklearn
+from sklearn.model_selection import train_test_split
 import pandas as pd
 
 housing_price_dataset = pd.read_csv('housing_price_dataset.csv')
 
-hp_train_test, hp_dev = sklearn.model_selection.train_test_split(housing_price_dataset, test_size=0.1)
-hp_train, hp_test = sklearn.model_selection.train_test_split(hp_train_test, test_size=1000)
+hp_train_test, hp_dev = train_test_split(housing_price_dataset, test_size=0.1)
+hp_train, hp_test = train_test_split(hp_train_test, test_size=1000)
 
 hp_train = pd.get_dummies(hp_train, columns=['Neighborhood'])
 hp_dev = pd.get_dummies(hp_dev, columns=['Neighborhood'])