ium_z486867/dataset-stats.py
2023-04-20 21:08:39 +02:00

21 lines
837 B
Python

import pandas
# Summarise the train/dev/test feature splits: for each split, write the
# pandas ``describe(include='all')`` table to ``<split>_stats.csv`` and then
# print the same table to stdout.

# Parser options shared by all three input files, kept in one place so the
# splits are always read with identical settings.
_READ_CSV_OPTIONS = {
    'engine': 'python',
    'encoding': 'ISO-8859-1',
    'sep': ',',
}

# All inputs are loaded before anything is written, so a missing or
# unreadable input file aborts the script before any stats file is created.
X_train = pandas.read_csv('X_train.csv', **_READ_CSV_OPTIONS)
X_dev = pandas.read_csv('X_dev.csv', **_READ_CSV_OPTIONS)
X_test = pandas.read_csv('X_test.csv', **_READ_CSV_OPTIONS)

# Compute each summary exactly once and reuse it for both the CSV export and
# the console output (previously every summary was computed twice).
_summaries = []
for _stats_path, _frame in (
    ('X_train_stats.csv', X_train),
    ('X_dev_stats.csv', X_dev),
    ('X_test_stats.csv', X_test),
):
    _summary = _frame.describe(include='all')
    # index=True keeps the statistic names (the summary's row labels) as the
    # first column of the output file.
    _summary.to_csv(_stats_path, index=True)
    _summaries.append(_summary)

# Print only after every stats file has been written, in train/dev/test order.
for _summary in _summaries:
    print(_summary)