ium_434766/lab2.ipynb

282 lines
137 KiB
Plaintext
Raw Normal View History

2021-03-20 20:04:51 +01:00
{
"metadata": {
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.5"
2021-03-20 20:04:51 +01:00
},
"orig_nbformat": 2,
"kernelspec": {
"name": "python385jvsc74a57bd02cef13873963874fd5439bd04a135498d1dd9725d9d90f40de0b76178a8e03b1",
"display_name": "Python 3.8.5 64-bit ('base': conda)"
2021-03-20 20:04:51 +01:00
}
},
"nbformat": 4,
"nbformat_minor": 2,
"cells": [
{
"cell_type": "code",
"execution_count": 1,
2021-03-20 20:04:51 +01:00
"metadata": {},
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
"Whole dataset size: 61320\nTrain dataset size: 35340\nTest dataset size: 11784\nValidate dataset size: 11784\n id gender age hypertension heart_disease \\\ncount 5110.000000 5110 5110.000000 5110.000000 5110.000000 \nunique NaN 3 NaN NaN NaN \ntop NaN Female NaN NaN NaN \nfreq NaN 2994 NaN NaN NaN \nmean 36517.829354 NaN 43.226614 0.097456 0.054012 \nstd 21161.721625 NaN 22.612647 0.296607 0.226063 \nmin 67.000000 NaN 0.080000 0.000000 0.000000 \n25% 17741.250000 NaN 25.000000 0.000000 0.000000 \n50% 36932.000000 NaN 45.000000 0.000000 0.000000 \n75% 54682.000000 NaN 61.000000 0.000000 0.000000 \nmax 72940.000000 NaN 82.000000 1.000000 1.000000 \n\n ever_married work_type Residence_type avg_glucose_level bmi \\\ncount 5110 5110 5110 5110.000000 4909.000000 \nunique 2 5 2 NaN NaN \ntop Yes Private Urban NaN NaN \nfreq 3353 2925 2596 NaN NaN \nmean NaN NaN NaN 106.147677 28.893237 \nstd NaN NaN NaN 45.283560 7.854067 \nmin NaN NaN NaN 55.120000 10.300000 \n25% NaN NaN NaN 77.245000 23.500000 \n50% NaN NaN NaN 91.885000 28.100000 \n75% NaN NaN NaN 114.090000 33.100000 \nmax NaN NaN NaN 271.740000 97.600000 \n\n smoking_status stroke \ncount 5110 5110.000000 \nunique 4 NaN \ntop never smoked NaN \nfreq 1892 NaN \nmean NaN 0.048728 \nstd NaN 0.215320 \nmin NaN 0.000000 \n25% NaN 0.000000 \n50% NaN 0.000000 \n75% NaN 0.000000 \nmax NaN 1.000000 \n"
]
}
],
"source": [
2021-03-28 20:50:30 +02:00
"import kaggle\n",
"import os\n",
2021-03-20 20:04:51 +01:00
"import numpy as np\n",
"import pandas as pd\n",
"from sklearn.preprocessing import MinMaxScaler\n",
"from sklearn.model_selection import train_test_split\n",
"\n",
"def downloadCSV():\n",
2021-03-28 20:50:30 +02:00
" kaggle.api.authenticate()\n",
" kaggle.api.dataset_download_files('fedesoriano/stroke-prediction-dataset', path='.', unzip=True)\n",
" data = pd.read_csv('healthcare-dataset-stroke-data.csv')\n",
2021-03-20 20:04:51 +01:00
"\n",
"def dropNaN():\n",
" data = pd.read_csv('healthcare-dataset-stroke-data.csv')\n",
" data = data.dropna()\n",
" return data\n",
"\n",
"def NormalizeData(data):\n",
" data = data.astype({\"age\": np.int64})\n",
" for col in data.columns:\n",
" if data[col].dtype == object: # STRINGS TO LOWERCASE\n",
" data[col] = data[col].str.lower()\n",
" if data[col].dtype == np.float64: # FLOATS TO VALUES IN [ 0, 1]\n",
" dataReshaped = data[col].values.reshape(-1,1)\n",
" scaler = MinMaxScaler(feature_range=(0, 1))\n",
" data[col] = scaler.fit_transform(dataReshaped)\n",
" if col == 'ever_married': # YES/NO TO 1/0\n",
" data[col] = data[col].map(dict(yes=1, no=0))\n",
" if col == 'smoking_status':\n",
" data[col] = data[col].str.replace(\" \", \"_\")\n",
" if col == 'work_type':\n",
" data[col] = data[col].str.replace(\"-\", \"_\")\n",
" return data\n",
"\n",
"def saveToCSV(data1,data2,data3):\n",
" data1.to_csv(\"data_train.csv\", index=False)\n",
" data2.to_csv(\"data_test.csv\",index=False)\n",
" data3.to_csv(\"data_val.csv\",index=False)\n",
"\n",
"def describeDataset(dt, dt2, dv):\n",
" data = pd.read_csv('healthcare-dataset-stroke-data.csv')\n",
" print(\"Whole dataset size: \", data.size)\n",
" print(\"Train dataset size: \", dt.size)\n",
" print(\"Test dataset size: \", dt2.size)\n",
" print(\"Validate dataset size: \", dv.size)\n",
" print(data.describe(include='all'))\n",
"\n",
"\n",
"# downloadCSV()\n",
2021-03-20 20:04:51 +01:00
"data = dropNaN()\n",
"data = NormalizeData(data)\n",
"\n",
"data_train, data_test = train_test_split(data, test_size=0.2, random_state=1)\n",
"data_train, data_val = train_test_split(data_train, test_size=0.25, random_state=1) ## Twice to get 0.6, 0.2, 0.2\n",
"saveToCSV(data_train,data_test,data_val)\n",
"describeDataset(data_train,data_test,data_val)\n",
"\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"array(['private', 'self_employed', 'govt_job', 'children', 'never_worked'],\n",
" dtype=object)"
]
},
"metadata": {},
"execution_count": 6
}
],
"source": [
"pd.unique(data['work_type'])"
]
},
2021-03-20 20:04:51 +01:00
{
"cell_type": "code",
"execution_count": 27,
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"metadata": {},
"execution_count": 27
},
{
"output_type": "display_data",
"data": {
"text/plain": "<Figure size 432x288 with 1 Axes>",
"image/svg+xml": "<?xml version=\"1.0\" encoding=\"utf-8\" standalone=\"no\"?>\r\n<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\r\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\r\n<!-- Created with matplotlib (https://matplotlib.org/) -->\r\n<svg height=\"310.257188pt\" version=\"1.1\" viewBox=\"0 0 381.65 310.257188\" width=\"381.65pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\r\n <metadata>\r\n <rdf:RDF xmlns:cc=\"http://creativecommons.org/ns#\" xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\">\r\n <cc:Work>\r\n <dc:type rdf:resource=\"http://purl.org/dc/dcmitype/StillImage\"/>\r\n <dc:date>2021-03-20T19:59:50.630059</dc:date>\r\n <dc:format>image/svg+xml</dc:format>\r\n <dc:creator>\r\n <cc:Agent>\r\n <dc:title>Matplotlib v3.3.2, https://matplotlib.org/</dc:title>\r\n </cc:Agent>\r\n </dc:creator>\r\n </cc:Work>\r\n </rdf:RDF>\r\n </metadata>\r\n <defs>\r\n <style type=\"text/css\">*{stroke-linecap:butt;stroke-linejoin:round;}</style>\r\n </defs>\r\n <g id=\"figure_1\">\r\n <g id=\"patch_1\">\r\n <path d=\"M -0 310.257188 \r\nL 381.65 310.257188 \r\nL 381.65 0 \r\nL -0 0 \r\nz\r\n\" style=\"fill:none;\"/>\r\n </g>\r\n <g id=\"axes_1\">\r\n <g id=\"patch_2\">\r\n <path d=\"M 39.65 224.64 \r\nL 374.45 224.64 \r\nL 374.45 7.2 \r\nL 39.65 7.2 \r\nz\r\n\" style=\"fill:#ffffff;\"/>\r\n </g>\r\n <g id=\"patch_3\">\r\n <path clip-path=\"url(#p8ec1192c17)\" d=\"M 56.39 224.64 \r\nL 89.87 224.64 \r\nL 89.87 17.554286 \r\nL 56.39 17.554286 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_4\">\r\n <path clip-path=\"url(#p8ec1192c17)\" d=\"M 123.35 224.64 \r\nL 156.83 224.64 \r\nL 156.83 166.656 \r\nL 123.35 166.656 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_5\">\r\n <path clip-path=\"url(#p8ec1192c17)\" d=\"M 190.31 224.64 \r\nL 223.79 224.64 \r\nL 223.79 176.001407 \r\nL 190.31 176.001407 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_6\">\r\n <path clip-path=\"url(#p8ec1192c17)\" d=\"M 257.27 224.64 \r\nL 290.75 224.64 \r\nL 290.75 178.125363 \r\nL 257.27 178.125363 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_7\">\r\n <path clip-path=\"url(#p8ec1192c17)\" d=\"M 324.23 224.64 \r\nL 357.71 224.64 \r\nL 357.71 223.082432 \r\nL 324.23 223.082432 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"matplotlib.axis_1\">\r\n <g id=\"xtick_1\">\r\n <g id=\"line2d_1\">\r\n <defs>\r\n <path d=\"M 0 0 \r\nL 0 3.5 \r\n\" id=\"m367ef2167c\" style=\"stroke:#000000;stroke-width:0.8;\"/>\r\n </defs>\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"73.13\" xlink:href=\"#m367ef2167c\" y=\"224.64\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_1\">\r\n <!-- Private -->\r\n <g transform=\"translate(75.889375 266.504063)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 19.671875 64.796875 \r\nL 19.671875 37.40625 \r\nL 32.078125 37.40625 \r\nQ 38.96875 37.40625 42.71875 40.96875 \r\nQ 46.484375 44.53125 46.484375 51.125 \r\nQ 46.484375 57.671875 42.71875 61.234375 \r\nQ 38.96875 64.796875 32.078125 64.796875 \r\nz\r\nM 9.8125 72.90625 \r\nL 32.078125 72.90625 \r\nQ 44.34375 72.90625 50.609375 67.359375 \r\nQ 56.890625 61.8125 56.890625 51.125 \r\nQ 56.890625 40.328125 50.609375 34.8125 \r\nQ 44.34375 29.296875 32.078125 29.296875 \r\nL 19.671875 29.296875 \r\nL 19.671875 0 \r\nL 9.8125 0 \r\nz\r\n\" id=\"DejaVuSans-80\"/>\r\n <path d=\"M 41.109375 46.296875 \r\nQ 39.59375 47.171875 37.8125 47.578125 \r\nQ 36.03125 48 33.890625 48 \r\nQ 26.265625 48 22.1875 43.046875 \r\nQ 18.109375 38.09375 18.109375 28.8125 \r\nL 18.109375 0 \r\nL 9.078125 0 \r\nL 9.078125 54.6875 \r\nL 18.109375 54.6875 \r\nL 18.109375 46.1875 \r\nQ 20.953125 51.171875 25.484375 53.578125 \r\nQ 30.03125 56 36.53125 56 \r\nQ 37.453125 56 38.578125 55.875 \r\nQ 39.703125 55.765625 41.0625 55.515625 \r\nz\r\n\" id=
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAE2CAYAAACN5kL+AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAAcp0lEQVR4nO3de7xdZX3n8c+XAJEKqTAcmDQJBjHMCKgIMYPKVCsqsUqDWDCIEpUaijjFjq2C9qVWmxmnDl7wJVQsl6COMV5JNVQQFYgi8QSRcJGSV0GSJkPiPVInmPidP9ZzzOZkn0tue+3wfN+v136dvZ691j6/vZP9PWs/61nPkm0iIqIOe7VdQERE9E5CPyKiIgn9iIiKJPQjIiqS0I+IqEhCPyKiInu3XcBYDj74YE+fPr3tMiIi9igrVqz4se2B4e1jhr6kJwA3AxPL+p+3/W5JBwGfBaYDDwJn2P5Z2eYi4BxgC/AXtr9W2o8Hrgb2A5YCF3iMEwWmT5/O4ODg+F5lREQAIOlH3drH072zCXih7WcCxwKzJZ0AXAjcaHsGcGNZRtJRwFzgaGA2cKmkCeW5LgPmAzPKbfaOvqCIiNh+Y4a+G78qi/uUm4E5wMLSvhA4tdyfAyyyvcn2A8AqYJakycAk27eWvftrOraJiIgeGNeBXEkTJN0BrAdusH0bcKjtdQDl5yFl9SnA6o7N15S2KeX+8PaIiOiRcYW+7S22jwWm0uy1HzPK6ur2FKO0b/sE0nxJg5IGN2zYMJ4SIyJiHLZryKbtnwPfoumLf7h02VB+ri+rrQGmdWw2FVhb2qd2ae/2ey63PdP2zIGBbQ4+R0TEDhoz9CUNSHpSub8f8CLgh8ASYF5ZbR5wbbm/BJgraaKkw2kO2C4vXUAbJZ0gScDZHdtEREQPjGec/mRgYRmBsxew2PZXJN0KLJZ0DvAQcDqA7bslLQbuATYD59veUp7rPLYO2byu3CIiokfU7/Ppz5w50xmnHxGxfSStsD1zeHvfn5G7s6Zf+NW2SwDgwfe/rO0SIiIy905ERE0S+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFUnoR0RUJKEfEVGRhH5EREUS+hERFRkz9CVNk/RNSfdKulvSBaX9PZL+TdId5fbHHdtcJGmVpPskndzRfrykleWxSyRp97ysiIjoZu9xrLMZeKvt2yUdAKyQdEN57EO2/3fnypKOAuYCRwN/AHxd0pG2twCXAfOB7wJLgdnAdbvmpURExFjG3NO3vc727eX+RuBeYMoom8wBFtneZPsBYBUwS9JkYJLtW20buAY4dWdfQEREjN929elLmg48C7itNL1Z0p2SrpR0YGmbAqzu2GxNaZtS7g9vj4iIHhl36EvaH/gC8Bbbv6TpqjkCOBZYB1w8tGqXzT1Ke7ffNV/SoKTBDRs2jLfEiIgYw7hCX9I+NIH/adtfBLD9sO0ttn8LfAKYVVZfA0zr2HwqsLa0T+3Svg3bl9ueaXvmwMDA9ryeiIgYxXhG7wi4ArjX9gc72id3rPYK4K5yfwkwV9JESYcDM4DlttcBGyWdUJ7zbODaXfQ6IiJiHMYzeud5wGuBlZLuKG3vAM6UdCxNF82DwLkAtu+WtBi4h2bkz/ll5A7AecDVwH40o3YycicioofGDH3by+jeH790lG0WAAu6tA8Cx2xPgRERsevkjNyIiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKjJm6EuaJumbku6VdLekC0r7QZJukHR/+XlgxzYXSVol6T5JJ3e0Hy9pZXnsEknaPS8rIiK6Gc+e/mbgrbafBpwAnC/pKOBC4EbbM4AbyzLlsbnA0cBs4FJJE8pzXQbMB2aU2+xd+FoiImIMY4a+7XW2by/3NwL3AlOAOcDCstpC4NRyfw6wyPYm2w8Aq4BZkiYDk2zfatvANR3bRERED2xXn76k6cCzgNuAQ22vg+YPA3BIWW0KsLpjszWlbUq5P7w9IiJ6ZNyhL2l/4AvAW2z/crRVu7R5lPZuv2u+pEFJgxs2bBhviRERMYZxhb6kfWgC/9O2v1iaHy5dNpSf60v7GmBax+ZTgbWlfWqX9m3Yvtz2TNszBwYGxvtaIiJiDOMZvSPgCuBe2x/seGgJMK/cnwdc29E+V9JESYfTHLBdXrqANko6oTzn2R3bRERED+w9jnWeB7wWWCnpjtL2DuD9wGJJ5wAPAacD2L5b0mLgHpqRP+fb3lK2Ow+4GtgPuK7cIiKiR8YMfdvL6N4fD3DSCNssABZ0aR8EjtmeAiMiYtfJGbkRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVCShHxFRkYR+RERFEvoRERVJ6EdEVGTM0Jd0paT1ku7qaHuPpH+TdEe5/XHHYxdJWiXpPkknd7QfL2lleewSSdr1LyciIkYznj39q4HZXdo/ZPvYclsKIOkoYC5wdNnmUkkTyvqXAfOBGeXW7TkjImI3GjP0bd8M/HSczzcHWGR7k+0HgFXALEmTgUm2b7Vt4Brg1B2sOSIidtDO9Om/WdKdpfvnwNI2BVjdsc6a0jal3B/eHhERPbSjoX8ZcARwLLAOuLi0d+un9yjtXUmaL2lQ0uCGDRt2sMSIiBhuh0Lf9sO2t9j+LfAJYFZ5aA0wrWPVqcDa0j61S/tIz3+57Zm2Zw4MDOxIiRER0cUOhX7pox/yCmBoZM8SYK6kiZIOpzlgu9z2OmCjpBPKqJ2zgWt3ou6IiNgBe4+1gqTPAC8ADpa0Bng38AJJx9J00TwInAtg+25Ji4F7gM3A+ba3lKc6j2Yk0H7AdeUWERE9NGbo2z6zS/MVo6y/AFjQpX0QOGa7qouIiF0qZ+RGRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGEfkRERcYMfUlXSlov6a6OtoMk3SDp/vLzwI7HLpK0StJ9kk7uaD9e0sry2CWStOtfTkREjGY8e/pXA7OHtV0I3Gh7BnBjWUbSUcBc4OiyzaWSJpRtLgPmAzPKbfhzRkTEbjZm6Nu+GfjpsOY5wMJyfyFwakf7ItubbD8ArAJmSZoMTLJ9q20D13RsExERPbKjffqH2l4HUH4eUtqnAKs71ltT2qaU+8PbIyKih3b1gdxu/fQepb37k0jzJQ1KGtywYcMuKy4ionY7GvoPly4bys/1pX0NMK1jvanA2tI+tUt7V7Yvtz3T9syBgYEdLDEiIobb0dBfAswr9+cB13a0z5U0UdLhNAdsl5cuoI2STiijds7u2CYiInpk77FWkPQZ4AXAwZLWAO8G3g8slnQO8BBwOoDtuyUtBu4BNgPn295Snuo8mpFA+wHXlVtERPTQmKFv+8wRHjpphPUXAAu6tA8Cx2xXdRERsUvljNyIiIok9CMiKpLQj4ioSEI/IqIiCf2IiIok9CMiKpLQj4ioSEI/IqIiY56cFY8f0y/8atslAPDg+1/WdgkR1cqefkRERRL6EREVSehHRFQkoR8RUZGEfkRERRL6EREVSehHRFQkoR8RUZGcnBVVyolqUavs6UdEVCR7+hGVy7eeumRPPyKiIgn9iIi
},
"metadata": {
"needs_background": "light"
}
}
],
"source": [
"data_orginal = pd.read_csv('healthcare-dataset-stroke-data.csv')\n",
"data_orginal['work_type'].value_counts().plot(kind=\"bar\")\n"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"metadata": {},
"execution_count": 23
},
{
"output_type": "display_data",
"data": {
"text/plain": "<Figure size 432x288 with 1 Axes>",
"image/svg+xml": "<?xml version=\"1.0\" encoding=\"utf-8\" standalone=\"no\"?>\r\n<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\r\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\r\n<!-- Created with matplotlib (https://matplotlib.org/) -->\r\n<svg height=\"245.2025pt\" version=\"1.1\" viewBox=\"0 0 381.65 245.2025\" width=\"381.65pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\r\n <metadata>\r\n <rdf:RDF xmlns:cc=\"http://creativecommons.org/ns#\" xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\">\r\n <cc:Work>\r\n <dc:type rdf:resource=\"http://purl.org/dc/dcmitype/StillImage\"/>\r\n <dc:date>2021-03-20T19:59:23.582020</dc:date>\r\n <dc:format>image/svg+xml</dc:format>\r\n <dc:creator>\r\n <cc:Agent>\r\n <dc:title>Matplotlib v3.3.2, https://matplotlib.org/</dc:title>\r\n </cc:Agent>\r\n </dc:creator>\r\n </cc:Work>\r\n </rdf:RDF>\r\n </metadata>\r\n <defs>\r\n <style type=\"text/css\">*{stroke-linecap:butt;stroke-linejoin:round;}</style>\r\n </defs>\r\n <g id=\"figure_1\">\r\n <g id=\"patch_1\">\r\n <path d=\"M -0 245.2025 \r\nL 381.65 245.2025 \r\nL 381.65 0 \r\nL -0 0 \r\nz\r\n\" style=\"fill:none;\"/>\r\n </g>\r\n <g id=\"axes_1\">\r\n <g id=\"patch_2\">\r\n <path d=\"M 39.65 224.64 \r\nL 374.45 224.64 \r\nL 374.45 7.2 \r\nL 39.65 7.2 \r\nz\r\n\" style=\"fill:#ffffff;\"/>\r\n </g>\r\n <g id=\"patch_3\">\r\n <path clip-path=\"url(#p9286a580eb)\" d=\"M 81.5 224.64 \r\nL 165.2 224.64 \r\nL 165.2 17.554286 \r\nL 81.5 17.554286 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_4\">\r\n <path clip-path=\"url(#p9286a580eb)\" d=\"M 248.9 224.64 \r\nL 332.6 224.64 \r\nL 332.6 214.032236 \r\nL 248.9 214.032236 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"matplotlib.axis_1\">\r\n <g id=\"xtick_1\">\r\n <g id=\"line2d_1\">\r\n <defs>\r\n <path d=\"M 0 0 \r\nL 0 3.5 \r\n\" id=\"m2d7a9c812c\" style=\"stroke:#000000;stroke-width:0.8;\"/>\r\n </defs>\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"123.35\" xlink:href=\"#m2d7a9c812c\" y=\"224.64\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_1\">\r\n <!-- 0 -->\r\n <g transform=\"translate(126.109375 238.0025)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 31.78125 66.40625 \r\nQ 24.171875 66.40625 20.328125 58.90625 \r\nQ 16.5 51.421875 16.5 36.375 \r\nQ 16.5 21.390625 20.328125 13.890625 \r\nQ 24.171875 6.390625 31.78125 6.390625 \r\nQ 39.453125 6.390625 43.28125 13.890625 \r\nQ 47.125 21.390625 47.125 36.375 \r\nQ 47.125 51.421875 43.28125 58.90625 \r\nQ 39.453125 66.40625 31.78125 66.40625 \r\nz\r\nM 31.78125 74.21875 \r\nQ 44.046875 74.21875 50.515625 64.515625 \r\nQ 56.984375 54.828125 56.984375 36.375 \r\nQ 56.984375 17.96875 50.515625 8.265625 \r\nQ 44.046875 -1.421875 31.78125 -1.421875 \r\nQ 19.53125 -1.421875 13.0625 8.265625 \r\nQ 6.59375 17.96875 6.59375 36.375 \r\nQ 6.59375 54.828125 13.0625 64.515625 \r\nQ 19.53125 74.21875 31.78125 74.21875 \r\nz\r\n\" id=\"DejaVuSans-48\"/>\r\n </defs>\r\n <use xlink:href=\"#DejaVuSans-48\"/>\r\n </g>\r\n </g>\r\n </g>\r\n <g id=\"xtick_2\">\r\n <g id=\"line2d_2\">\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"290.75\" xlink:href=\"#m2d7a9c812c\" y=\"224.64\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_2\">\r\n <!-- 1 -->\r\n <g transform=\"translate(293.509375 238.0025)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 12.40625 8.296875 \r\nL 28.515625 8.296875 \r\nL 28.515625 63.921875 \r\nL 10.984375 60.40625 \r\nL 10.984375 69.390625 \r\nL 28.421875 72.90625 \r\nL 38.28125 72.90625 \r\nL 38.28125 8.296875 \r\nL 54.390625 8.296875 \r\nL 54.390625 0 \r\nL 12.40625 0 \r\nz\r\n\" id=\"DejaVuSans-49\"/>\r\n </defs>\r\n <use xlink:href=\"#DejaVuSans-49\"/>\r\n </g>\r\n </g>\r\n </g>\r\n </g>\r\n <g id=\"matplotlib.axis_2\">\r\n
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAD1CAYAAAC87SVQAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAANhUlEQVR4nO3df6jd913H8edryVaDs9jSmxDvzUzAiCYFO3qJgf6jq9jIxPSfSgbaIIELJcMOBE38R/wjUP8RKdhC0NEUdTGgo6GzmyFaRAxLb7SuS7vYYLvkktDczYnZP9Fkb/+4H93h5uTec9vk3C6f5wMO53ve5/s993Mge/bwPT+WqkKS1IePrPYCJEnjY/QlqSNGX5I6YvQlqSNGX5I6YvQlqSNrV3sBy3nggQdq8+bNq70MSfqBcubMmW9V1cTi+UjRT/IucBW4AVyvqukk9wN/CWwG3gV+taq+0/Y/COxr+/9mVX2lzR8GXgDWAX8DPF3LfFFg8+bNzM7OjrJMSVKT5JvD5is5vfPzVfVQVU232weAk1W1FTjZbpNkG7AH2A7sAp5LsqYd8zwwA2xtl10rfSKSpPfvg5zT3w0cadtHgMcH5ker6lpVvQOcB3Yk2QjcW1Wn2qv7FweOkSSNwajRL+Bvk5xJMtNmG6rqMkC7Xt/mk8DFgWPn2myybS+e3yTJTJLZJLPz8/MjLlGStJxR38h9pKouJVkPnEjyjSX2zZBZLTG/eVh1GDgMMD097Y8DSdJtMtIr/aq61K6vAF8EdgDvtVM2tOsrbfc5YNPA4VPApTafGjKXJI3JstFP8sNJfuT/toFfBL4OHAf2tt32Ai+17ePAniT3JNnCwhu2p9spoKtJdiYJ8OTAMZKkMRjl9M4G4IsLnWYt8BdV9eUkrwHHkuwDLgBPAFTV2STHgDeB68D+qrrRHuspvv+RzVfaRZI0Jvmw/57+9PR0+Tl9SVqZJGcGPmL//z7038j9QbH5wJdWewl3jXef+fRqL0G6a/nbO5LUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0x+pLUEaMvSR0ZOfpJ1iT5lyQvt9v3JzmR5O12fd/AvgeTnE9yLsljA/OHk7zR7ns2SW7v05EkLWUlr/SfBt4auH0AOFlVW4GT7TZJtgF7gO3ALuC5JGvaMc8DM8DWdtn1gVYvSVqRkaKfZAr4NPAnA+PdwJG2fQR4fGB+tKquVdU7wHlgR5KNwL1VdaqqCnhx4BhJ0hiM+kr/j4DfBr43MNtQVZcB2vX6Np8ELg7sN9dmk2178VySNCbLRj/JLwNXqurMiI857Dx9LTEf9jdnkswmmZ2fnx/xz0qSljPKK/1HgF9J8i5wFPhUkj8D3munbGjXV9r+c8CmgeOngEttPjVkfpOqOlxV01U1PTExsYKnI0layrLRr6qDVTVVVZtZeIP276rq14DjwN62217gpbZ9HNiT5J4kW1h4w/Z0OwV0NcnO9qmdJweOkSSNwdoPcOwzwLEk+4ALwBMAVXU2yTHgTeA6sL+qbrRjngJeANYBr7SLJGlMVhT9qnoVeLVtfxt49Bb7HQIODZnPAg+udJGSpNvDb+RKUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1ZNnoJ/mhJKeT/GuSs0l+v83vT3Iiydvt+r6BYw4mOZ/kXJLHBuYPJ3mj3fdsktyZpyVJGmaUV/rXgE9V1c8ADwG7kuwEDgAnq2orcLLdJsk2YA+wHdgFPJdkTXus54EZYGu77Lp9T0WStJxlo18LvttufrRdCtgNHGnzI8DjbXs3cLSqrlXVO8B5YEeSjcC9VXWqqgp4ceAYSdIYjHROP8maJK8DV4ATVfVVYENVXQZo1+vb7pPAxYHD59pssm0vnkuSxmSk6FfVjap6CJhi4VX7g0vsPuw8fS0xv/kBkpkks0lm5+fnR1miJGkEK/r0TlX9J/AqC+fi32unbGjXV9puc8CmgcOmgEttPjVkPuzvHK6q6aqanpiYWMkSJUlLGOXTOxNJfrRtrwN+AfgGcBzY23bbC7zUto8De5Lck2QLC2/Ynm6ngK4m2dk+tfPkwDGSpDFYO8I+G4Ej7RM4HwGOVdXLSU4Bx5LsAy4ATwBU1dkkx4A3gevA/qq60R7rKeAFYB3wSrtIksZk2ehX1deATw6Zfxt49BbHHAIODZnPAku9HyBJuoP8Rq4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdcToS1JHjL4kdWTZ6CfZlOTvk7yV5GySp9v8/iQnkrzdru8bOOZgkvNJziV5bGD+cJI32n3PJsmdeVqSpGFGeaV/HfitqvppYCewP8k24ABwsqq2Aifbbdp9e4DtwC7guSRr2mM9D8wAW9tl1218LpKkZSwb/aq6XFX/3LavAm8Bk8Bu4Ejb7QjweNveDRytqmtV9Q5wHtiRZCNwb1WdqqoCXhw4RpI0Bis6p59kM/BJ4KvAhqq6DAv/YQDWt90mgYsDh8212WTbXjyXJI3JyNFP8nHgr4DPVdV/LbXrkFktMR/2t2aSzCaZnZ+fH3WJkqRljBT9JB9lIfh/XlV/3cbvtVM2tOsrbT4HbBo4fAq41OZTQ+Y3qarDVTVdVdMTExOjPhdJ0jJG+fROgD8F3qqqPxy46ziwt23vBV4amO9Jck+SLSy8YXu6nQK6mmRne8wnB46RJI3B2hH2eQT4deCNJK+32e8CzwDHkuwDLgBPAFTV2STHgDdZ+OTP/qq60Y57CngBWAe80i6SpDFZNvpV9Y8MPx8P8OgtjjkEHBoynwUeXMkCJUm3j9/IlaSOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6siy0U/y+SRXknx9YHZ/khNJ3m7X9w3cdzDJ+STnkjw2MH84yRvtvmeT5PY/HUnSUkZ5pf8CsGvR7ABwsqq2AifbbZJsA/YA29sxzyVZ0455HpgBtrbL4seUJN1hy0a/qv4B+I9F493AkbZ9BHh8YH60qq5V1TvAeWBHko3AvVV1qqoKeHHgGEnSmLzfc/obquoyQLte3+aTwMWB/ebabLJtL55Lksbodr+RO+w8fS0xH/4gyUyS2SSz8/Pzt21xktS79xv999opG9r1lTafAzYN7DcFXGrzqSHzoarqcFVNV9X0xMTE+1yiJGmx9xv948Detr0XeGlgvifJPUm2sPCG7el2Cuhqkp3tUztPDhwjSRqTtcvtkOQLwM8BDySZA34PeAY4lmQfcAF4AqCqziY5BrwJXAf2V9WN9lBPsfBJoHXAK+0iSRqjZaNfVZ+5xV2P3mL/Q8ChIfNZ4MEVrU6SdFv5jVxJ6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6ojRl6SOGH1J6oj
},
"metadata": {
"needs_background": "light"
}
}
],
"source": [
"data_orginal['stroke'].value_counts().plot(kind=\"bar\")\n"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"metadata": {},
"execution_count": 24
},
{
"output_type": "display_data",
"data": {
"text/plain": "<Figure size 432x288 with 1 Axes>",
"image/svg+xml": "<?xml version=\"1.0\" encoding=\"utf-8\" standalone=\"no\"?>\r\n<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\r\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\r\n<!-- Created with matplotlib (https://matplotlib.org/) -->\r\n<svg height=\"245.758775pt\" version=\"1.1\" viewBox=\"0 0 381.65 245.758775\" width=\"381.65pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\r\n <metadata>\r\n <rdf:RDF xmlns:cc=\"http://creativecommons.org/ns#\" xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\">\r\n <cc:Work>\r\n <dc:type rdf:resource=\"http://purl.org/dc/dcmitype/StillImage\"/>\r\n <dc:date>2021-03-20T19:59:26.764208</dc:date>\r\n <dc:format>image/svg+xml</dc:format>\r\n <dc:creator>\r\n <cc:Agent>\r\n <dc:title>Matplotlib v3.3.2, https://matplotlib.org/</dc:title>\r\n </cc:Agent>\r\n </dc:creator>\r\n </cc:Work>\r\n </rdf:RDF>\r\n </metadata>\r\n <defs>\r\n <style type=\"text/css\">*{stroke-linecap:butt;stroke-linejoin:round;}</style>\r\n </defs>\r\n <g id=\"figure_1\">\r\n <g id=\"patch_1\">\r\n <path d=\"M -0 245.758775 \r\nL 381.65 245.758775 \r\nL 381.65 0 \r\nL -0 0 \r\nz\r\n\" style=\"fill:none;\"/>\r\n </g>\r\n <g id=\"axes_1\">\r\n <g id=\"patch_2\">\r\n <path d=\"M 39.65 225.196275 \r\nL 374.45 225.196275 \r\nL 374.45 7.756275 \r\nL 39.65 7.756275 \r\nz\r\n\" style=\"fill:#ffffff;\"/>\r\n </g>\r\n <g id=\"patch_3\">\r\n <path clip-path=\"url(#p773d4bda8f)\" d=\"M 81.5 225.196275 \r\nL 165.2 225.196275 \r\nL 165.2 18.110561 \r\nL 81.5 18.110561 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_4\">\r\n <path clip-path=\"url(#p773d4bda8f)\" d=\"M 248.9 225.196275 \r\nL 332.6 225.196275 \r\nL 332.6 213.372598 \r\nL 248.9 213.372598 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"matplotlib.axis_1\">\r\n <g id=\"xtick_1\">\r\n <g id=\"line2d_1\">\r\n <defs>\r\n <path d=\"M 0 0 \r\nL 0 3.5 \r\n\" id=\"m89701e199f\" style=\"stroke:#000000;stroke-width:0.8;\"/>\r\n </defs>\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"123.35\" xlink:href=\"#m89701e199f\" y=\"225.196275\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_1\">\r\n <!-- 0 -->\r\n <g transform=\"translate(126.109375 238.558775)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 31.78125 66.40625 \r\nQ 24.171875 66.40625 20.328125 58.90625 \r\nQ 16.5 51.421875 16.5 36.375 \r\nQ 16.5 21.390625 20.328125 13.890625 \r\nQ 24.171875 6.390625 31.78125 6.390625 \r\nQ 39.453125 6.390625 43.28125 13.890625 \r\nQ 47.125 21.390625 47.125 36.375 \r\nQ 47.125 51.421875 43.28125 58.90625 \r\nQ 39.453125 66.40625 31.78125 66.40625 \r\nz\r\nM 31.78125 74.21875 \r\nQ 44.046875 74.21875 50.515625 64.515625 \r\nQ 56.984375 54.828125 56.984375 36.375 \r\nQ 56.984375 17.96875 50.515625 8.265625 \r\nQ 44.046875 -1.421875 31.78125 -1.421875 \r\nQ 19.53125 -1.421875 13.0625 8.265625 \r\nQ 6.59375 17.96875 6.59375 36.375 \r\nQ 6.59375 54.828125 13.0625 64.515625 \r\nQ 19.53125 74.21875 31.78125 74.21875 \r\nz\r\n\" id=\"DejaVuSans-48\"/>\r\n </defs>\r\n <use xlink:href=\"#DejaVuSans-48\"/>\r\n </g>\r\n </g>\r\n </g>\r\n <g id=\"xtick_2\">\r\n <g id=\"line2d_2\">\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"290.75\" xlink:href=\"#m89701e199f\" y=\"225.196275\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_2\">\r\n <!-- 1 -->\r\n <g transform=\"translate(293.509375 238.558775)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 12.40625 8.296875 \r\nL 28.515625 8.296875 \r\nL 28.515625 63.921875 \r\nL 10.984375 60.40625 \r\nL 10.984375 69.390625 \r\nL 28.421875 72.90625 \r\nL 38.28125 72.90625 \r\nL 38.28125 8.296875 \r\nL 54.390625 8.296875 \r\nL 54.390625 0 \r\nL 12.40625 0 \r\nz\r\n\" id=\"DejaVuSans-49\"/>\r\n </defs>\r\n <use xlink:href=\"#DejaVuSans-49\"/>\r\n </g>\r\n </g>\r\n <
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAD1CAYAAAC87SVQAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAANiklEQVR4nO3dUYidZ17H8e9vk91ucC22dBKyM1lTMIsmBXfpEAO9USs2umJ6U8mCNkhgoGSxC4KbeiNeBOqNSMEWgi5NUTcGdGno2l1rtCxi3HSqdbtpNzbYbjIkNNN1xexNNdm/F/PIHiYnM2fayZkyz/cDh/Oe/3nfmefA9NvDO++ZpKqQJPXhQ2u9AEnS+Bh9SeqI0Zekjhh9SeqI0Zekjhh9SerIxlF2SvIWcBW4DlyrqukkdwJ/CWwH3gJ+raq+1/Z/DDjY9v+tqvpam98LPA1sAv4GeLSWuWb0rrvuqu3bt6/wZUlS315++eV3qmpi8Xyk6Dc/V1XvDDw+DJyqqseTHG6Pv5BkJ7Af2AV8HPi7JJ+squvAU8AM8M8sRH8v8PxS33T79u3Mzs6uYJmSpCTfGTZ/P6d39gHH2vYx4MGB+fGqereq3gTOA7uTbAVur6rT7d39MwPHSJLGYNToF/C3SV5OMtNmW6rqMkC739zmk8DFgWPn2myybS+e3yDJTJLZJLPz8/MjLlGStJxRT+/cV1WXkmwGXkjy7SX2zZBZLTG/cVh1FDgKMD097d+JkKRVMtI7/aq61O6vAF8GdgNvt1M2tPsrbfc5YNvA4VPApTafGjKXJI3JstFP8iNJfvT/t4FfBL4FnAQOtN0OAM+27ZPA/iS3Jbkb2AGcaaeAribZkyTAwwPHSJLGYJTTO1uALy90mo3AX1TVV5O8BJxIchC4ADwEUFVnk5wAXgOuAYfalTsAj/DDSzafZ5krdyRJqysf9D+tPD09XV6yKUkrk+TlqppePPcTuZLUkZV8OEtL2H74K2u9hHXjrcc/s9ZLkNYt3+lLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1xOhLUkeMviR1ZOToJ9mQ5F+TPNce35nkhSRvtPs7BvZ9LMn5JOeSPDAwvzfJq+25J5JkdV+OJGkpK3mn/yjw+sDjw8CpqtoBnGqPSbIT2A/sAvYCTybZ0I55CpgBdrTb3ve1eknSiowU/SRTwGeAPxkY7wOOte1jwIMD8+NV9W5VvQmcB3Yn2QrcXlWnq6qAZwaOkSSNwajv9P8I+B3gBwOzLVV1GaDdb27zSeDiwH5zbTbZthfPb5BkJslsktn5+fkRlyhJWs6y0U/yK8CVqnp5xK857Dx9LTG/cVh1tKqmq2p6YmJixG8rSVrOxhH2uQ/41SS/DHwUuD3JnwFvJ9laVZfbqZsrbf85YNvA8VPApTafGjKXJI3Jsu/0q+qxqpqqqu0s/IL276vq14GTwIG22wHg2bZ9Etif5LYkd7PwC9sz7RTQ1SR72lU7Dw8cI0kag1He6d/M48CJJAeBC8BDAFV1NskJ4DXgGnCoqq63Yx4BngY2Ac+3myRpTFYU/ap6EXixbX8XuP8m+x0BjgyZzwL3rHSRkqTV4SdyJakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOmL0JakjRl+SOrJs9JN8NMmZJP+W5GyS32/zO5O8kOSNdn/HwDGPJTmf5FySBwbm9yZ5tT33RJLcmpclSRpmlHf67wI/X1U/DXwK2JtkD3AYOFVVO4BT7TFJdgL7gV3AXuDJJBva13oKmAF2tNve1XspkqTlLBv9WvD99vDD7VbAPuBYmx8DHmzb+4DjVfVuVb0JnAd2J9kK3F5Vp6uqgGcGjpEkjcFI5/STbEjyCnAFeKGqvgFsqarLAO1+c9t9Erg4cPhcm0227cXzYd9vJslsktn5+fkVvBxJ0lJGin5VXa+qTwFTLLxrv2eJ3Yedp68l5sO+39Gqmq6q6YmJiVGWKEkawYqu3qmq/wJeZOFc/NvtlA3t/krbbQ7YNnDYFHCpzaeGzCVJYzLK1TsTSX6sbW8CfgH4NnASONB2OwA827ZPAvuT3JbkbhZ+YXumnQK6mmRPu2rn4YFjJEljsHGEfbYCx9oVOB8CTlTVc0lOAyeSHAQuAA8BVNXZJCeA14BrwKGqut6+1iPA08Am4Pl2kySNybLRr6pvAp8eMv8ucP9NjjkCHBkynwWW+n2AJOkW8hO5ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHTH6ktQRoy9JHVk2+km2JfmHJK8nOZvk0Ta/M8kLSd5o93cMHPNYkvNJziV5YGB+b5JX23NPJMmteVmSpGFGead/DfjtqvopYA9wKMlO4DBwqqp2AKfaY9pz+4FdwF7gySQb2td6CpgBdrTb3lV8LZKkZSwb/aq6XFX/0ravAq8Dk8A+4Fjb7RjwYNveBxyvqner6k3gPLA7yVbg9qo6XVUFPDNwjCRpDFZ0Tj/JduDTwDeALVV1GRb+xwBsbrtNAhcHDptrs8m2vXg+7PvMJJlNMjs/P7+SJUqSljBy9JN8DPgr4PNV9d9L7TpkVkvMbxxWHa2q6aqanpiYGHWJkqRljBT9JB9mIfh/XlV/3cZvt1M2tPsrbT4HbBs4fAq41OZTQ+aSpDEZ5eqdAH8KvF5Vfzjw1EngQNs+ADw7MN+f5LYkd7PwC9sz7RTQ1SR72td8eOAYSdIYbBxhn/uA3wBeTfJKm/0u8DhwIslB4ALwEEBVnU1yAniNhSt/DlXV9XbcI8DTwCbg+XaTJI3JstGvqn9k+Pl4gPtvcswR4MiQ+Sxwz0oWKElaPX4iV5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSNGX5I6YvQlqSPLRj/JF5NcSfKtgdmdSV5I8ka7v2PguceSnE9yLskDA/N7k7zannsiSVb/5UiSljLKO/2ngb2LZoeBU1W1AzjVHpNkJ7Af2NWOeTLJhnbMU8AMsKPdFn9NSdIttmz0q+rrwH8uGu8DjrXtY8CDA/PjVfVuVb0JnAd2J9kK3F5Vp6uqgGcGjpEkjcl7Pae/paouA7T7zW0+CVwc2G+uzSbb9uL5UElmkswmmZ2fn3+PS5QkLbbav8gddp6+lpgPVVVHq2q6qqYnJiZWbXGS1Lv3Gv232ykb2v2VNp8Dtg3sNwVcavOpIXNJ0hi91+ifBA607QPAswPz/UluS3I3C7+wPdNOAV1NsqddtfPwwDGSpDHZuNwOSb4E/CxwV5I54PeAx4ETSQ4CF4CHAKrqbJITwGvANeBQVV1vX+oRFq4E2gQ8326SpDFaNvpV9dmbPHX/TfY/AhwZMp8F7lnR6iRJq8pP5EpSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6EtSR4y+JHXE6Et
},
"metadata": {
"needs_background": "light"
}
}
],
"source": [
"data_orginal['heart_disease'].value_counts().plot(kind=\"bar\")\n"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"metadata": {},
"execution_count": 25
},
{
"output_type": "display_data",
"data": {
"text/plain": "<Figure size 432x288 with 1 Axes>",
"image/svg+xml": "<?xml version=\"1.0\" encoding=\"utf-8\" standalone=\"no\"?>\r\n<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\r\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\r\n<!-- Created with matplotlib (https://matplotlib.org/) -->\r\n<svg height=\"323.293125pt\" version=\"1.1\" viewBox=\"0 0 381.65 323.293125\" width=\"381.65pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\r\n <metadata>\r\n <rdf:RDF xmlns:cc=\"http://creativecommons.org/ns#\" xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\">\r\n <cc:Work>\r\n <dc:type rdf:resource=\"http://purl.org/dc/dcmitype/StillImage\"/>\r\n <dc:date>2021-03-20T19:59:30.902892</dc:date>\r\n <dc:format>image/svg+xml</dc:format>\r\n <dc:creator>\r\n <cc:Agent>\r\n <dc:title>Matplotlib v3.3.2, https://matplotlib.org/</dc:title>\r\n </cc:Agent>\r\n </dc:creator>\r\n </cc:Work>\r\n </rdf:RDF>\r\n </metadata>\r\n <defs>\r\n <style type=\"text/css\">*{stroke-linecap:butt;stroke-linejoin:round;}</style>\r\n </defs>\r\n <g id=\"figure_1\">\r\n <g id=\"patch_1\">\r\n <path d=\"M -0 323.293125 \r\nL 381.65 323.293125 \r\nL 381.65 0 \r\nL -0 0 \r\nz\r\n\" style=\"fill:none;\"/>\r\n </g>\r\n <g id=\"axes_1\">\r\n <g id=\"patch_2\">\r\n <path d=\"M 39.65 224.64 \r\nL 374.45 224.64 \r\nL 374.45 7.2 \r\nL 39.65 7.2 \r\nz\r\n\" style=\"fill:#ffffff;\"/>\r\n </g>\r\n <g id=\"patch_3\">\r\n <path clip-path=\"url(#p5adb89c86e)\" d=\"M 60.575 224.64 \r\nL 102.425 224.64 \r\nL 102.425 17.554286 \r\nL 60.575 17.554286 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_4\">\r\n <path clip-path=\"url(#p5adb89c86e)\" d=\"M 144.275 224.64 \r\nL 186.125 224.64 \r\nL 186.125 55.644047 \r\nL 144.275 55.644047 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_5\">\r\n <path clip-path=\"url(#p5adb89c86e)\" d=\"M 227.975 224.64 \r\nL 269.825 224.64 \r\nL 269.825 127.773796 \r\nL 227.975 127.773796 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_6\">\r\n <path clip-path=\"url(#p5adb89c86e)\" d=\"M 311.675 224.64 \r\nL 353.525 224.64 \r\nL 353.525 138.281317 \r\nL 311.675 138.281317 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"matplotlib.axis_1\">\r\n <g id=\"xtick_1\">\r\n <g id=\"line2d_1\">\r\n <defs>\r\n <path d=\"M 0 0 \r\nL 0 3.5 \r\n\" id=\"m5a93e58ddd\" style=\"stroke:#000000;stroke-width:0.8;\"/>\r\n </defs>\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"81.5\" xlink:href=\"#m5a93e58ddd\" y=\"224.64\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_1\">\r\n <!-- never smoked -->\r\n <g transform=\"translate(84.259375 302.49)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 54.890625 33.015625 \r\nL 54.890625 0 \r\nL 45.90625 0 \r\nL 45.90625 32.71875 \r\nQ 45.90625 40.484375 42.875 44.328125 \r\nQ 39.84375 48.1875 33.796875 48.1875 \r\nQ 26.515625 48.1875 22.3125 43.546875 \r\nQ 18.109375 38.921875 18.109375 30.90625 \r\nL 18.109375 0 \r\nL 9.078125 0 \r\nL 9.078125 54.6875 \r\nL 18.109375 54.6875 \r\nL 18.109375 46.1875 \r\nQ 21.34375 51.125 25.703125 53.5625 \r\nQ 30.078125 56 35.796875 56 \r\nQ 45.21875 56 50.046875 50.171875 \r\nQ 54.890625 44.34375 54.890625 33.015625 \r\nz\r\n\" id=\"DejaVuSans-110\"/>\r\n <path d=\"M 56.203125 29.59375 \r\nL 56.203125 25.203125 \r\nL 14.890625 25.203125 \r\nQ 15.484375 15.921875 20.484375 11.0625 \r\nQ 25.484375 6.203125 34.421875 6.203125 \r\nQ 39.59375 6.203125 44.453125 7.46875 \r\nQ 49.3125 8.734375 54.109375 11.28125 \r\nL 54.109375 2.78125 \r\nQ 49.265625 0.734375 44.1875 -0.34375 \r\nQ 39.109375 -1.421875 33.890625 -1.421875 \r\nQ 20.796875 -1.421875 13.15625 6.1875 \r\nQ 5.515625 13.8125 5.515625 26.8125 \r\nQ 5.515625 40.234375 12.765625 48.109375 \r\nQ 20.015625 56 32.328125 56 \r\nQ 43.359375 56 49.78125 48.890625 \r\nQ 56.203125 41.796875 56.203125 29.59375 \r\nz\r\nM 47.21875 32.234375 \r\nQ 47.125 39.59375 43.09
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAFCCAYAAAAdVQ0pAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAAcdUlEQVR4nO3dfZRdVZ3m8e9DQLSV9ICUiARJwIATIkaJiI0vKNMQQCG+djIKttIrwoJhbFpH0O7Rtie96FF02jc0NojYAqJIE1tBEFHaF8QKRBLASCBRQzJQSKu0LxkSn/nj7IJLUXmpcyt17q3zfNa6q+7Z99x7f7mr6sm5++yzt2wTERHtsFPTBURExMRJ6EdEtEhCPyKiRRL6EREtktCPiGiRnZsuYFv23HNPT58+vekyIiL6yrJlyx6wPTCyvedDf/r06QwODjZdRkREX5H009Ha070TEdEiCf2IiBZJ6EdEtEhCPyKiRRL6EREtktCPiGiRhH5ERIsk9CMiWiShHxHRIj1/Re6OMP3srzZdwjatPff4pkuIiEkoR/oRES2S0I+IaJGEfkREiyT0IyJaJKEfEdEiCf2IiBZJ6EdEtEhCPyKiRRL6EREtktCPiGiRhH5ERItsM/QlXSjpfkkrO9q+IGl5ua2VtLy0T5f0u47HPtnxnEMlrZC0WtJHJGmH/IsiImKLtmfCtYuAjwEXDzfY/rPh+5LOA37Vsf/dtueM8jrnA4uAm4CvAfOAq8dccURE1LbNI33bNwIPjvZYOVp/A3Dp1l5D0t7AVNvft22q/0Dmj7naiIjoSrd9+i8B7rN9V0fbDEm3Svq2pJeUtn2AdR37rCtto5K0SNKgpMGhoaEuS4yIiGHdhv5CHnuUvwF4pu3nAWcBl0iaCozWf+8tvajtJbbn2p47MDDQZYkRETGs9iIqknYGXgMcOtxmeyOwsdxfJulu4ECqI/tpHU+fBqyv+94REVFPN0f6/wX4se1Hum0kDUiaUu7vD8wE7rG9AXhI0uHlPMDJwFVdvHdERNSwPUM2LwW+DxwkaZ2kU8pDC3j8CdyXArdJ+hHwJeBU28MngU8D/glYDdxNRu5EREy4bXbv2F64hfY/H6XtCuCKLew/CMweY30RETGOckVuRESLJPQjIlokoR8R0SIJ/YiIFknoR0S0SEI/IqJFEvoRES2S0I+IaJGEfkREiyT0IyJaJKEfEdEiCf2IiBZJ6EdEtEhCPyKiRRL6EREtktCPiGiRhH5ERIvUXhg9AmD62V9tuoTtsvbc45suIaInbM8auRdKul/Syo6290m6V9Lycjuu47FzJK2WtErSMR3th0paUR77SFkgPSIiJtD2dO9cBMwbpf3DtueU29cAJM2iWjD94PKcT0iaUvY/H1gEzCy30V4zIiJ2oG2Gvu0bgQe38/VOBC6zvdH2GmA1cJikvYGptr9v28DFwPyaNUdERE3dnMg9Q9Jtpftn99K2D/Dzjn3WlbZ9yv2R7aOStEjSoKTBoaGhLkqMiIhOdUP/fOAAYA6wATivtI/WT++ttI/K9hLbc23PHRgYqFliRESMVCv0bd9ne7PtPwCfBg4rD60D9u3YdRqwvrRPG6U9IiImUK3QL330w14NDI/sWQoskLSrpBlUJ2xvtr0BeEjS4WXUzsnAVV3UHRERNWxznL6kS4EjgT0lrQPeCxwpaQ5VF81a4G0Atm+XdDlwB7AJON325vJSp1GNBHoScHW5RUTEBNpm6NteOErzBVvZfzGweJT2QWD2mKqLiIhxlWkYIiJaJKEfEdEiCf2IiBZJ6EdEtEhCPyKiRRL6EREtktCPiGiRhH5ERIsk9CMiWiShHxHRIgn9iIgWSehHRLRIQj8iokUS+hERLZLQj4hokYR+RESLJPQjIlokoR8R0SIJ/YiIFtlm6Eu6UNL9klZ2tH1A0o8l3SbpSkn/qbRPl/Q7ScvL7ZMdzzlU0gpJqyV9RJJ2yL8oIiK2aHuO9C8C5o1ouw6YbfsQ4CfAOR2P3W17Trmd2tF+PrAImFluI18zIiJ2sG2Gvu0bgQdHtF1re1PZvAmYtrXXkLQ3MNX2920buBiYX6viiIiobTz69N8KXN2xPUPSrZK+LeklpW0fYF3HPutK26gkLZI0KGlwaGhoHEqMiAjoMvQlvQfYBHy+NG0Anmn7ecBZwCWSpgKj9d97S69re4ntubbnDgwMdFNiRER02LnuEyW9GXglcFTpssH2RmBjub9M0t3AgVRH9p1dQNOA9XXfOyIi6ql1pC9pHvAu4ATbv+1oH5A0pdzfn+qE7T22NwAPSTq8jNo5Gbiq6+ojImJMtnmkL+lS4EhgT0nrgPdSjdbZFbiujLy8qYzUeSnwfkmbgM3AqbaHTwKfRjUS6ElU5wA6zwNERMQE2Gbo2144SvMFW9j3CuCKLTw2CMweU3URETGuckVuRESLJPQjIlokoR8R0SIJ/YiIFknoR0S0SEI/IqJFEvoRES2S0I+IaJGEfkREiyT0IyJaJKEfEdEiCf2IiBZJ6EdEtEhCPyKiRRL6EREtktCPiGiRhH5ERIsk9CMiWmSboS/pQkn3S1rZ0baHpOsk3VV+7t7x2DmSVktaJemYjvZDJa0oj32kLJAeERETaHuO9C8C5o1oOxu43vZM4PqyjaRZwALg4PKcT0iaUp5zPrAImFluI18zIiJ2sG2Gvu0bgQdHNJ8IfLbc/ywwv6P9Mtsbba8BVgOHSdobmGr7+7YNXNzxnIiImCB1+/T3sr0BoPx8WmnfB/h5x37rSts+5f7I9lFJWiRpUNLg0NBQzRIjImKk8T6RO1o/vbfSPirbS2zPtT13YGBg3IqLiGi7uqF/X+myofy8v7SvA/bt2G8asL60TxulPSIiJlDd0F8KvLncfzNwVUf7Akm7SppBdcL25tIF9JCkw8uonZM7nhMRERNk523tIOlS4EhgT0nrgPcC5wKXSzoF+BnwegDbt0u6HLgD2AScbntzeanTqEYCPQm4utwiImICbTP0bS/cwkNHbWH/xcDiUdoHgdljqi4iIsZVrsiNiGiRhH5ERIsk9CMiWiShHxHRIgn9iIgWSehHRLRIQj8iokW2OU4/IibO9LO/2nQJ22Xtucc3XULUlCP9iIgWSehHRLRIQj8iokUS+hERLZLQj4hokYR+RESLJPQjIlokoR8R0SIJ/YiIFskVuRExaeUK58fLkX5ERIvUDn1JB0la3nH7taS3S3qfpHs72o/reM45klZLWiXpmPH5J0RExPaq3b1jexUwB0DSFOBe4ErgLcCHbX+wc39Js4AFwMHAM4BvSDrQ9ua6NURExNiMV/fOUcDdtn+6lX1OBC6zvdH2GmA1cNg4vX9ERGyH8Qr9BcClHdtnSLpN0oWSdi9t+wA/79hnXWl7HEmLJA1KGhwaGhqnEiMiouvQl/QE4ATgi6XpfOAAqq6fDcB5w7uO8nSP9pq2l9iea3vuwMBAtyVGREQxHkf6xwK32L4PwPZ9tjfb/gPwaR7twlkH7NvxvGnA+nF4/4iI2E7jEfoL6ejakbR3x2OvBlaW+0uBBZJ2lTQDmAncPA7vHxER26mri7Mk/RHwp8DbOpr/t6Q5VF03a4cfs327pMuBO4BNwOkZuRMRMbG6Cn3bvwWeOqLtpK3svxhY3M17RkREfbkiNyKiRRL6EREtktCPiGiRhH5ERIsk9CMiWiShHxHRIgn9iIgWSehHRLRIQj8iokUS+hERLZLQj4hokYR+RESLJPQjIlokoR8R0SIJ/YiIFknoR0S0SEI/IqJFEvoRES3SVehLWitphaTlkgZL2x6SrpN0V/m5e8f+50haLWmVpGO6LT4iIsZmPI70X257ju25Zfts4HrbM4HryzaSZgELgIOBecAnJE0Zh/ePiIjttCO6d04EPlvufxaY39F+me2NttcAq4HDdsD7R0TEFnQb+gaulbRM0qLStpftDQDl59NK+z7Azzueu660PY6kRZIGJQ0ODQ11WWJERAzbucvnH2F7vaSnAddJ+vFW9tUobR5tR9tLgCUAc+fOHXWfiIgYu66O9G2vLz/vB66k6q65T9LeAOXn/WX
},
"metadata": {
"needs_background": "light"
}
}
],
"source": [
"data_orginal['smoking_status'].value_counts().plot(kind=\"bar\")\n"
]
},
{
"cell_type": "code",
2021-03-26 16:36:45 +01:00
"execution_count": 28,
2021-03-20 20:04:51 +01:00
"metadata": {},
"outputs": [
{
"output_type": "execute_result",
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"metadata": {},
2021-03-26 16:36:45 +01:00
"execution_count": 28
2021-03-20 20:04:51 +01:00
},
{
"output_type": "display_data",
"data": {
"text/plain": "<Figure size 432x288 with 1 Axes>",
2021-03-26 16:36:45 +01:00
"image/svg+xml": "<?xml version=\"1.0\" encoding=\"utf-8\" standalone=\"no\"?>\r\n<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\r\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\r\n<!-- Created with matplotlib (https://matplotlib.org/) -->\r\n<svg height=\"269.08375pt\" version=\"1.1\" viewBox=\"0 0 381.65 269.08375\" width=\"381.65pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\r\n <metadata>\r\n <rdf:RDF xmlns:cc=\"http://creativecommons.org/ns#\" xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\">\r\n <cc:Work>\r\n <dc:type rdf:resource=\"http://purl.org/dc/dcmitype/StillImage\"/>\r\n <dc:date>2021-03-20T20:06:01.190561</dc:date>\r\n <dc:format>image/svg+xml</dc:format>\r\n <dc:creator>\r\n <cc:Agent>\r\n <dc:title>Matplotlib v3.3.2, https://matplotlib.org/</dc:title>\r\n </cc:Agent>\r\n </dc:creator>\r\n </cc:Work>\r\n </rdf:RDF>\r\n </metadata>\r\n <defs>\r\n <style type=\"text/css\">*{stroke-linecap:butt;stroke-linejoin:round;}</style>\r\n </defs>\r\n <g id=\"figure_1\">\r\n <g id=\"patch_1\">\r\n <path d=\"M -0 269.08375 \r\nL 381.65 269.08375 \r\nL 381.65 0 \r\nL -0 0 \r\nz\r\n\" style=\"fill:none;\"/>\r\n </g>\r\n <g id=\"axes_1\">\r\n <g id=\"patch_2\">\r\n <path d=\"M 39.65 224.64 \r\nL 374.45 224.64 \r\nL 374.45 7.2 \r\nL 39.65 7.2 \r\nz\r\n\" style=\"fill:#ffffff;\"/>\r\n </g>\r\n <g id=\"patch_3\">\r\n <path clip-path=\"url(#pd3e9aec6be)\" d=\"M 81.5 224.64 \r\nL 165.2 224.64 \r\nL 165.2 17.554286 \r\nL 81.5 17.554286 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"patch_4\">\r\n <path clip-path=\"url(#pd3e9aec6be)\" d=\"M 248.9 224.64 \r\nL 332.6 224.64 \r\nL 332.6 24.095514 \r\nL 248.9 24.095514 \r\nz\r\n\" style=\"fill:#1f77b4;\"/>\r\n </g>\r\n <g id=\"matplotlib.axis_1\">\r\n <g id=\"xtick_1\">\r\n <g id=\"line2d_1\">\r\n <defs>\r\n <path d=\"M 0 0 \r\nL 0 3.5 \r\n\" id=\"md6de6d2197\" style=\"stroke:#000000;stroke-width:0.8;\"/>\r\n </defs>\r\n <g>\r\n <use style=\"stroke:#000000;stroke-width:0.8;\" x=\"123.35\" xlink:href=\"#md6de6d2197\" y=\"224.64\"/>\r\n </g>\r\n </g>\r\n <g id=\"text_1\">\r\n <!-- Urban -->\r\n <g transform=\"translate(126.109375 261.88375)rotate(-90)scale(0.1 -0.1)\">\r\n <defs>\r\n <path d=\"M 8.6875 72.90625 \r\nL 18.609375 72.90625 \r\nL 18.609375 28.609375 \r\nQ 18.609375 16.890625 22.84375 11.734375 \r\nQ 27.09375 6.59375 36.625 6.59375 \r\nQ 46.09375 6.59375 50.34375 11.734375 \r\nQ 54.59375 16.890625 54.59375 28.609375 \r\nL 54.59375 72.90625 \r\nL 64.5 72.90625 \r\nL 64.5 27.390625 \r\nQ 64.5 13.140625 57.4375 5.859375 \r\nQ 50.390625 -1.421875 36.625 -1.421875 \r\nQ 22.796875 -1.421875 15.734375 5.859375 \r\nQ 8.6875 13.140625 8.6875 27.390625 \r\nz\r\n\" id=\"DejaVuSans-85\"/>\r\n <path d=\"M 41.109375 46.296875 \r\nQ 39.59375 47.171875 37.8125 47.578125 \r\nQ 36.03125 48 33.890625 48 \r\nQ 26.265625 48 22.1875 43.046875 \r\nQ 18.109375 38.09375 18.109375 28.8125 \r\nL 18.109375 0 \r\nL 9.078125 0 \r\nL 9.078125 54.6875 \r\nL 18.109375 54.6875 \r\nL 18.109375 46.1875 \r\nQ 20.953125 51.171875 25.484375 53.578125 \r\nQ 30.03125 56 36.53125 56 \r\nQ 37.453125 56 38.578125 55.875 \r\nQ 39.703125 55.765625 41.0625 55.515625 \r\nz\r\n\" id=\"DejaVuSans-114\"/>\r\n <path d=\"M 48.6875 27.296875 \r\nQ 48.6875 37.203125 44.609375 42.84375 \r\nQ 40.53125 48.484375 33.40625 48.484375 \r\nQ 26.265625 48.484375 22.1875 42.84375 \r\nQ 18.109375 37.203125 18.109375 27.296875 \r\nQ 18.109375 17.390625 22.1875 11.75 \r\nQ 26.265625 6.109375 33.40625 6.109375 \r\nQ 40.53125 6.109375 44.609375 11.75 \r\nQ 48.6875 17.390625 48.6875 27.296875 \r\nz\r\nM 18.109375 46.390625 \r\nQ 20.953125 51.265625 25.265625 53.625 \r\nQ 29.59375 56 35.59375 56 \r\nQ 45.5625 56 51.78125 48.09375 \r\nQ 58.015625 40.1875 58.015625 27.296875 \r\nQ 58.015625 14.40625 51.78125 6.484375 \r\nQ 45.5625 -1.421875 35.59375 -1.421875 \r\nQ 29.59375 -1.
2021-03-20 20:04:51 +01:00
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAENCAYAAADjW7WQAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAAQGUlEQVR4nO3df6zddX3H8eeLVpEIGEgvDNtiGemihWUoN00zlkxlG51uFpeQlSzSP0xqSI26uT/AfzRZmrgfasIyWGp0lIWNdVHTJsI2JGSGDMUL6VZK7ewsg2ubtqKbnS5o63t/nO+NZ+3pvbe3t+fA+Twfycn5nvf5fL/nfXJvXvd7P9/v95xUFZKkNlww6gYkScNj6EtSQwx9SWqIoS9JDTH0Jakhhr4kNWTpqBuYy7Jly2rVqlWjbkOSXlWefvrp71bVxKn1V3zor1q1iqmpqVG3IUmvKkn+c1Dd6R1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQ17xF2e9Wqy668ujbmFsPP/Jd4+6BWlsuacvSQ0x9CWpIYa+JDVkztBPsjLJ40n2Jdmb5MNd/RNJvpNkd3d7V986dyc5kGR/klv66jcm2dM9d0+SnJ+3JUkaZD4Hck8AH62qZ5JcAjyd5NHuuc9U1Z/1D06yBtgIXAe8EfhKkl+oqpPAfcBm4GvAw8B64JHFeSuSpLnMuadfVYer6plu+TiwD1g+yyobgIeq6uWqOggcANYmuQq4tKqerKoCHgBuPdc3IEmav7M6ZTPJKuCtwNeBm4APJrkDmKL338D36f1B+FrfatNd7Sfd8ql1SeeRpxMvrlf7KcXzPpCb5GLgC8BHquoH9KZqrgVuAA4Dn5oZOmD1mqU+6LU2J5lKMnXs2LH5tihJmsO8Qj/Ja+gF/oNV9UWAqjpSVSer6qfAZ4G13fBpYGXf6iuAQ119xYD6aapqW1VNVtXkxMRp3/YlSVqg+Zy9E+BzwL6q+nRf/aq+Ye8Fnu2WdwEbk1yY5BpgNfBUVR0GjidZ123zDmDnIr0PSdI8zGdO/ybgfcCeJLu72seA25PcQG+K5nngAwBVtTfJDuA5emf+bOnO3AG4E7gfuIjeWTueuSNJQzRn6FfVEwyej394lnW2AlsH1KeA68+mQUnS4vGKXElqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGmLoS1JDDH1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaYuhLUkMMfUlqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGjJn6CdZmeTxJPuS7E3y4a5+eZJHk3yru7+sb527kxxIsj/JLX31G5Ps6Z67J0nOz9uSJA0ynz39E8BHq+otwDpgS5I1wF3AY1W1Gnise0z33EbgOmA9cG+SJd227gM2A6u72/pFfC+SpDnMGfpVdbiqnumWjwP7gOXABmB7N2w7cGu3vAF4qKperqqDwAFgbZKrgEur6smqKuCBvnUkSUNwVnP6SVYBbwW+DlxZVYeh94cBuKIbthx4sW+16a62vFs+tS5JGpJ5h36Si4EvAB+pqh/MNnRArWapD3qtzUmmkkwdO3Zsvi1KkuYwr9BP8hp6gf9gVX2xKx/ppmzo7o929WlgZd/qK4BDXX3FgPppqmpbVU1W1eTExMR834skaQ7zOXsnwOeAfVX16b6ndgGbuuVNwM6++sYkFya5ht4B26e6KaDjSdZ127yjbx1J0hAsnceYm4D3AXuS7O5qHwM+CexI8n7gBeA2gKram2QH8By9M3+2VNXJbr07gfuBi4BHupskaUjmDP2qeoLB8/EAN59hna3A1gH1KeD6s2lQkrR4vCJXkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaYuhLUkMMfUlqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGmLoS1JDDH1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGzBn6ST6f5GiSZ/tqn0jynSS7u9u7+p67O8mBJPuT3NJXvzHJnu65e5Jk8d+OJGk289nTvx9YP6D+maq6obs9DJBkDbARuK5b594kS7rx9wGbgdXdbdA2JUnn0ZyhX1VfBb43z+1tAB6qqper6iBwAFib5Crg0qp6sqoKeAC4dYE9S5IW6Fzm9D+Y5N+66Z/Lutpy4MW+MdNdbXm3fGpdkjRECw39+4BrgRuAw8CnuvqgefqapT5Qks1JppJMHTt2bIEtSpJOtaDQr6ojVXWyqn4KfBZY2z01DazsG7oCONTVVwyon2n726pqsqomJyYmFtKiJGmABYV+N0c/473AzJk9u4CNSS5Mcg29A7ZPVdVh4HiSdd1ZO3cAO8+hb0nSAiyda0CSvwXeDixLMg18HHh7khvoTdE8D3wAoKr2JtkBPAecALZU1cluU3fSOxPoIuCR7iZJGqI5Q7+qbh9Q/tws47cCWwfUp4Drz6o7SdKi8opcSWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaYuhLUkMMfUlqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGmLoS1JDDH1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaMmfoJ/l8kqNJnu2rXZ7k0STf6u4v63vu7iQHkuxPcktf/cYke7rn7kmSxX87kqTZzGdP/35g/Sm1u4DHqmo18Fj3mCRrgI3Add069yZZ0q1zH7AZWN3dTt2mJOk8mzP0q+qrwPdOKW8AtnfL24Fb++oPVdXLVXUQOACsTXIVcGlVPVlVBTzQt44kaUgWOqd/ZVUdBujur+jqy4EX+8ZNd7Xl3fKpdUnSEC32gdxB8/Q1S33wRpLNSaaSTB07dmzRmpOk1i009I90UzZ090e7+jSwsm/cCuBQV18xoD5QVW2rqsmqmpyYmFhgi5KkUy009HcBm7rlTcDOvvrGJBcmuYbeAdunuimg40nWdWft3NG3jiRpSJbONSDJ3wJvB5YlmQY+DnwS2JHk/cALwG0AVbU3yQ7gOeAEsKWqTnabupPemUAXAY90N0nSEM0Z+lV1+xmeuvkM47cCWwfUp4Drz6o7SdKi8opcSWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaYuhLUkMMfUlqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGmLoS1JDDH1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5Iack6hn+T5JHuS7E4y1dUuT/Jokm9195f1jb87yYEk+5Pccq7NS5LOzmLs6b+jqm6oqsnu8V3AY1W1Gnise0ySNcBG4DpgPXBvkiWL8PqSpHk6H9M7G4Dt3fJ24Na++kNV9XJVHQQOAGvPw+tLks7gXEO/gH9K8nSSzV3tyqo6DNDdX9HVlwMv9q073dUkSUOy9BzXv6mqDiW5Ang0yTdnGZsBtRo4sPcHZDPA1VdffY4tSpJmnNOeflUd6u6PAl+iN11zJMlVAN390W74NLCyb/UVwKEzbHdbVU1W1eTExMS5tChJ6rPg0E/y+iSXzCwDvwE8C+wCNnXDNgE7u+VdwMYkFya5BlgNPLXQ15cknb1zmd65EvhSkpnt/E1V/UOSbwA7krwfeAG4DaCq9ibZATwHnAC2VNXJc+peknRWFhz6VfVt4JcG1F8Cbj7DOluBrQt9TUnSufGKXElqiKEvSQ0x9CWpIYa+JDXE0Jekhhj6ktQQQ1+SGmLoS1JDDH1JaoihL0kNMfQlqSGGviQ1xNCXpIYY+pLUEENfkhpi6EtSQwx9SWqIoS9JDTH0Jakhhr4kNcTQl6SGGPqS1BBDX5IaYuhLUkMMfUlqiKEvSQ0
},
"metadata": {
"needs_background": "light"
}
}
],
"source": [
"data_orginal['Residence_type'].value_counts().plot(kind=\"bar\")"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
]
}