{ "cells": [ { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "hNYAM1jr8P8v", "outputId": "318f51a0-e7a8-4d69-86f3-3412ca800459" }, "outputs": [], "source": [ "# Download the dataset with the Python standard library: the recorded run of\n", "# this cell failed with 'wget: not found', so it must not rely on that binary.\n", "import shutil\n", "from pathlib import Path\n", "from urllib.request import urlopen\n", "\n", "DATA_URL = 'https://git.wmi.amu.edu.pl/s434695/ium_434695/raw/commit/2301fb86e434734376f73503307a8f3255a75cc6/vgsales.csv'\n", "DATA_PATH = Path('vgsales.csv')\n", "\n", "# Skip the download when the file already exists so re-running the cell is cheap.\n", "if not DATA_PATH.exists():\n", "    # Write to a temporary name first: an interrupted transfer must not leave a\n", "    # truncated vgsales.csv behind.\n", "    partial_path = DATA_PATH.with_name(DATA_PATH.name + '.part')\n", "    with urlopen(DATA_URL) as response, open(partial_path, 'wb') as sink:\n", "        shutil.copyfileobj(response, sink)\n", "    partial_path.replace(DATA_PATH)\n" ] }, { "cell_type": "code", "execution_count": 8, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "l6wJKCw7iqQ8", "outputId": "91fcfedc-4cdf-4208-9a9e-a02b56b6db83" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: pandas in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (1.2.3)\n", "Requirement already satisfied: pytz>=2017.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from pandas) (2021.1)\n", "Requirement already satisfied: numpy>=1.16.5 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from pandas) (1.20.1)\n", "Requirement already satisfied: python-dateutil>=2.7.3 in /snap/jupyter/6/lib/python3.7/site-packages (from pandas) (2.8.0)\n", "Requirement already satisfied: six>=1.5 in /snap/jupyter/6/lib/python3.7/site-packages (from python-dateutil>=2.7.3->pandas) (1.12.0)\n", "Requirement already satisfied: scikit-learn in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (0.24.1)\n", "Requirement already satisfied: numpy>=1.13.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.20.1)\n", "Requirement already satisfied: joblib>=0.11 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.0.1)\n", "Requirement already satisfied: threadpoolctl>=2.0.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (2.1.0)\n", "Requirement already satisfied: scipy>=0.19.1 in 
/home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.6.1)\n", "Collecting matplotlib\n", "\u001b[?25l Downloading https://files.pythonhosted.org/packages/23/3d/db9a6b3c83c9511301152dbb64a029c3a4313c86eaef12c237b13ecf91d6/matplotlib-3.3.4-cp37-cp37m-manylinux1_x86_64.whl (11.5MB)\n", "\u001b[K |████████████████████████████████| 11.6MB 4.9MB/s eta 0:00:01 |██████████▊ | 3.9MB 1.7MB/s eta 0:00:05\n", "\u001b[?25hCollecting cycler>=0.10 (from matplotlib)\n", " Downloading https://files.pythonhosted.org/packages/f7/d2/e07d3ebb2bd7af696440ce7e754c59dd546ffe1bbe732c8ab68b9c834e61/cycler-0.10.0-py2.py3-none-any.whl\n", "Collecting kiwisolver>=1.0.1 (from matplotlib)\n", "\u001b[?25l Downloading https://files.pythonhosted.org/packages/d2/46/231de802ade4225b76b96cffe419cf3ce52bbe92e3b092cf12db7d11c207/kiwisolver-1.3.1-cp37-cp37m-manylinux1_x86_64.whl (1.1MB)\n", "\u001b[K |████████████████████████████████| 1.1MB 6.1MB/s eta 0:00:01\n", "\u001b[?25hRequirement already satisfied: numpy>=1.15 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (1.20.1)\n", "Requirement already satisfied: python-dateutil>=2.1 in /snap/jupyter/6/lib/python3.7/site-packages (from matplotlib) (2.8.0)\n", "Requirement already satisfied: pillow>=6.2.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (8.1.2)\n", "Collecting pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=2.0.3 (from matplotlib)\n", "\u001b[?25l Downloading https://files.pythonhosted.org/packages/8a/bb/488841f56197b13700afd5658fc279a2025a39e22449b7cf29864669b15d/pyparsing-2.4.7-py2.py3-none-any.whl (67kB)\n", "\u001b[K |████████████████████████████████| 71kB 5.5MB/s eta 0:00:01\n", "\u001b[?25hRequirement already satisfied: six in /snap/jupyter/6/lib/python3.7/site-packages (from cycler>=0.10->matplotlib) (1.12.0)\n", "Installing collected packages: cycler, kiwisolver, pyparsing, matplotlib\n", "Successfully installed cycler-0.10.0 kiwisolver-1.3.1 
matplotlib-3.3.4 pyparsing-2.4.7\n" ] } ], "source": [ "# Install through the interpreter that runs this kernel: a bare `pip` found on\n", "# the shell PATH may belong to a different Python than the notebook uses.\n", "import sys\n", "\n", "# One invocation lets pip resolve the three packages together.\n", "!{sys.executable} -m pip install --user pandas scikit-learn matplotlib" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 493 }, "id": "uXRk5Z4tixiJ", "outputId": "ed788406-9f0f-418c-93ef-54398dc4613d" }, "outputs": [ { "data": { "text/html": [ "
\n", " | Rank | \n", "Name | \n", "Platform | \n", "Year | \n", "Genre | \n", "Publisher | \n", "NA_Sales | \n", "EU_Sales | \n", "JP_Sales | \n", "Other_Sales | \n", "Global_Sales | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "Wii Sports | \n", "Wii | \n", "2006.0 | \n", "Sports | \n", "Nintendo | \n", "41.49 | \n", "29.02 | \n", "3.77 | \n", "8.46 | \n", "82.74 | \n", "
1 | \n", "2 | \n", "Super Mario Bros. | \n", "NES | \n", "1985.0 | \n", "Platform | \n", "Nintendo | \n", "29.08 | \n", "3.58 | \n", "6.81 | \n", "0.77 | \n", "40.24 | \n", "
2 | \n", "3 | \n", "Mario Kart Wii | \n", "Wii | \n", "2008.0 | \n", "Racing | \n", "Nintendo | \n", "15.85 | \n", "12.88 | \n", "3.79 | \n", "3.31 | \n", "35.82 | \n", "
3 | \n", "4 | \n", "Wii Sports Resort | \n", "Wii | \n", "2009.0 | \n", "Sports | \n", "Nintendo | \n", "15.75 | \n", "11.01 | \n", "3.28 | \n", "2.96 | \n", "33.00 | \n", "
4 | \n", "5 | \n", "Pokemon Red/Pokemon Blue | \n", "GB | \n", "1996.0 | \n", "Role-Playing | \n", "Nintendo | \n", "11.27 | \n", "8.89 | \n", "10.22 | \n", "1.00 | \n", "31.37 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
16593 | \n", "16596 | \n", "Woody Woodpecker in Crazy Castle 5 | \n", "GBA | \n", "2002.0 | \n", "Platform | \n", "Kemco | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16594 | \n", "16597 | \n", "Men in Black II: Alien Escape | \n", "GC | \n", "2003.0 | \n", "Shooter | \n", "Infogrames | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16595 | \n", "16598 | \n", "SCORE International Baja 1000: The Official Game | \n", "PS2 | \n", "2008.0 | \n", "Racing | \n", "Activision | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16596 | \n", "16599 | \n", "Know How 2 | \n", "DS | \n", "2010.0 | \n", "Puzzle | \n", "7G//AMES | \n", "0.00 | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16597 | \n", "16600 | \n", "Spirits & Spells | \n", "GBA | \n", "2003.0 | \n", "Platform | \n", "Wanadoo | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16598 rows × 11 columns
\n", "\n", " | Rank | \n", "Name | \n", "Platform | \n", "Year | \n", "Genre | \n", "Publisher | \n", "NA_Sales | \n", "EU_Sales | \n", "JP_Sales | \n", "Other_Sales | \n", "Global_Sales | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "16598.000000 | \n", "16598 | \n", "16598 | \n", "16327.000000 | \n", "16598 | \n", "16540 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "
unique | \n", "NaN | \n", "11493 | \n", "31 | \n", "NaN | \n", "12 | \n", "578 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
top | \n", "NaN | \n", "Need for Speed: Most Wanted | \n", "DS | \n", "NaN | \n", "Action | \n", "Electronic Arts | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
freq | \n", "NaN | \n", "12 | \n", "2163 | \n", "NaN | \n", "3316 | \n", "1351 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
mean | \n", "8300.605254 | \n", "NaN | \n", "NaN | \n", "2006.406443 | \n", "NaN | \n", "NaN | \n", "0.264667 | \n", "0.146652 | \n", "0.077782 | \n", "0.048063 | \n", "0.537441 | \n", "
std | \n", "4791.853933 | \n", "NaN | \n", "NaN | \n", "5.828981 | \n", "NaN | \n", "NaN | \n", "0.816683 | \n", "0.505351 | \n", "0.309291 | \n", "0.188588 | \n", "1.555028 | \n", "
min | \n", "1.000000 | \n", "NaN | \n", "NaN | \n", "1980.000000 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.010000 | \n", "
25% | \n", "4151.250000 | \n", "NaN | \n", "NaN | \n", "2003.000000 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.060000 | \n", "
50% | \n", "8300.500000 | \n", "NaN | \n", "NaN | \n", "2007.000000 | \n", "NaN | \n", "NaN | \n", "0.080000 | \n", "0.020000 | \n", "0.000000 | \n", "0.010000 | \n", "0.170000 | \n", "
75% | \n", "12449.750000 | \n", "NaN | \n", "NaN | \n", "2010.000000 | \n", "NaN | \n", "NaN | \n", "0.240000 | \n", "0.110000 | \n", "0.040000 | \n", "0.040000 | \n", "0.470000 | \n", "
max | \n", "16600.000000 | \n", "NaN | \n", "NaN | \n", "2020.000000 | \n", "NaN | \n", "NaN | \n", "41.490000 | \n", "29.020000 | \n", "10.220000 | \n", "10.570000 | \n", "82.740000 | \n", "