{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "hNYAM1jr8P8v", "outputId": "318f51a0-e7a8-4d69-86f3-3412ca800459" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "/bin/sh: 1: wget: not found\r\n" ] } ], "source": [ "!wget -c https://git.wmi.amu.edu.pl/s434695/ium_434695/raw/commit/2301fb86e434734376f73503307a8f3255a75cc6/vgsales.csv\n" ] }, { "cell_type": "code", "execution_count": 13, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "l6wJKCw7iqQ8", "outputId": "91fcfedc-4cdf-4208-9a9e-a02b56b6db83" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: pandas in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (1.2.3)\n", "Requirement already satisfied: pytz>=2017.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from pandas) (2021.1)\n", "Requirement already satisfied: python-dateutil>=2.7.3 in /snap/jupyter/6/lib/python3.7/site-packages (from pandas) (2.8.0)\n", "Requirement already satisfied: numpy>=1.16.5 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from pandas) (1.20.1)\n", "Requirement already satisfied: six>=1.5 in /snap/jupyter/6/lib/python3.7/site-packages (from python-dateutil>=2.7.3->pandas) (1.12.0)\n", "Requirement already satisfied: scikit-learn in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (0.24.1)\n", "Requirement already satisfied: joblib>=0.11 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.0.1)\n", "Requirement already satisfied: threadpoolctl>=2.0.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (2.1.0)\n", "Requirement already satisfied: numpy>=1.13.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.20.1)\n", "Requirement already satisfied: scipy>=0.19.1 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from scikit-learn) (1.6.1)\n", "Requirement already satisfied: matplotlib in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (3.3.4)\n", "Requirement already satisfied: kiwisolver>=1.0.1 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (1.3.1)\n", "Requirement already satisfied: pillow>=6.2.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (8.1.2)\n", "Requirement already satisfied: python-dateutil>=2.1 in /snap/jupyter/6/lib/python3.7/site-packages (from matplotlib) (2.8.0)\n", "Requirement already satisfied: numpy>=1.15 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (1.20.1)\n", "Requirement already satisfied: cycler>=0.10 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (0.10.0)\n", "Requirement already satisfied: pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=2.0.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib) (2.4.7)\n", "Requirement already satisfied: six>=1.5 in /snap/jupyter/6/lib/python3.7/site-packages (from python-dateutil>=2.1->matplotlib) (1.12.0)\n", "Collecting seaborn\n", "\u001b[?25l Downloading https://files.pythonhosted.org/packages/68/ad/6c2406ae175f59ec616714e408979b674fe27b9587f79d59a528ddfbcd5b/seaborn-0.11.1-py3-none-any.whl (285kB)\n", "\u001b[K |████████████████████████████████| 286kB 1.1MB/s eta 0:00:01\n", "\u001b[?25hRequirement already satisfied: scipy>=1.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from seaborn) (1.6.1)\n", "Requirement already satisfied: matplotlib>=2.2 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from seaborn) (3.3.4)\n", "Requirement already satisfied: numpy>=1.15 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from seaborn) (1.20.1)\n", "Requirement already satisfied: pandas>=0.23 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from seaborn) (1.2.3)\n", "Requirement already satisfied: python-dateutil>=2.1 in /snap/jupyter/6/lib/python3.7/site-packages (from matplotlib>=2.2->seaborn) (2.8.0)\n", "Requirement already satisfied: pillow>=6.2.0 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib>=2.2->seaborn) (8.1.2)\n", "Requirement already satisfied: kiwisolver>=1.0.1 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib>=2.2->seaborn) (1.3.1)\n", "Requirement already satisfied: cycler>=0.10 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib>=2.2->seaborn) (0.10.0)\n", "Requirement already satisfied: pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=2.0.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from matplotlib>=2.2->seaborn) (2.4.7)\n", "Requirement already satisfied: pytz>=2017.3 in /home/tomasz/snap/jupyter/common/lib/python3.7/site-packages (from pandas>=0.23->seaborn) (2021.1)\n", "Requirement already satisfied: six>=1.5 in /snap/jupyter/6/lib/python3.7/site-packages (from python-dateutil>=2.1->matplotlib>=2.2->seaborn) (1.12.0)\n", "Installing collected packages: seaborn\n", "Successfully installed seaborn-0.11.1\n" ] } ], "source": [ "!pip install --user pandas\n", "!pip install --user scikit-learn\n", "!pip install --user matplotlib\n", "!pip install --user seaborn" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 493 }, "id": "uXRk5Z4tixiJ", "outputId": "ed788406-9f0f-418c-93ef-54398dc4613d" }, "outputs": [ { "data": { "text/html": [ "
\n", " | Rank | \n", "Name | \n", "Platform | \n", "Year | \n", "Genre | \n", "Publisher | \n", "NA_Sales | \n", "EU_Sales | \n", "JP_Sales | \n", "Other_Sales | \n", "Global_Sales | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "Wii Sports | \n", "Wii | \n", "2006.0 | \n", "Sports | \n", "Nintendo | \n", "41.49 | \n", "29.02 | \n", "3.77 | \n", "8.46 | \n", "82.74 | \n", "
1 | \n", "2 | \n", "Super Mario Bros. | \n", "NES | \n", "1985.0 | \n", "Platform | \n", "Nintendo | \n", "29.08 | \n", "3.58 | \n", "6.81 | \n", "0.77 | \n", "40.24 | \n", "
2 | \n", "3 | \n", "Mario Kart Wii | \n", "Wii | \n", "2008.0 | \n", "Racing | \n", "Nintendo | \n", "15.85 | \n", "12.88 | \n", "3.79 | \n", "3.31 | \n", "35.82 | \n", "
3 | \n", "4 | \n", "Wii Sports Resort | \n", "Wii | \n", "2009.0 | \n", "Sports | \n", "Nintendo | \n", "15.75 | \n", "11.01 | \n", "3.28 | \n", "2.96 | \n", "33.00 | \n", "
4 | \n", "5 | \n", "Pokemon Red/Pokemon Blue | \n", "GB | \n", "1996.0 | \n", "Role-Playing | \n", "Nintendo | \n", "11.27 | \n", "8.89 | \n", "10.22 | \n", "1.00 | \n", "31.37 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
16593 | \n", "16596 | \n", "Woody Woodpecker in Crazy Castle 5 | \n", "GBA | \n", "2002.0 | \n", "Platform | \n", "Kemco | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16594 | \n", "16597 | \n", "Men in Black II: Alien Escape | \n", "GC | \n", "2003.0 | \n", "Shooter | \n", "Infogrames | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16595 | \n", "16598 | \n", "SCORE International Baja 1000: The Official Game | \n", "PS2 | \n", "2008.0 | \n", "Racing | \n", "Activision | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16596 | \n", "16599 | \n", "Know How 2 | \n", "DS | \n", "2010.0 | \n", "Puzzle | \n", "7G//AMES | \n", "0.00 | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16597 | \n", "16600 | \n", "Spirits & Spells | \n", "GBA | \n", "2003.0 | \n", "Platform | \n", "Wanadoo | \n", "0.01 | \n", "0.00 | \n", "0.00 | \n", "0.00 | \n", "0.01 | \n", "
16598 rows × 11 columns
\n", "\n", " | Rank | \n", "Name | \n", "Platform | \n", "Year | \n", "Genre | \n", "Publisher | \n", "NA_Sales | \n", "EU_Sales | \n", "JP_Sales | \n", "Other_Sales | \n", "Global_Sales | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "16598.000000 | \n", "16598 | \n", "16598 | \n", "16327.000000 | \n", "16598 | \n", "16540 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "16598.000000 | \n", "
unique | \n", "NaN | \n", "11493 | \n", "31 | \n", "NaN | \n", "12 | \n", "578 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
top | \n", "NaN | \n", "Need for Speed: Most Wanted | \n", "DS | \n", "NaN | \n", "Action | \n", "Electronic Arts | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
freq | \n", "NaN | \n", "12 | \n", "2163 | \n", "NaN | \n", "3316 | \n", "1351 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
mean | \n", "8300.605254 | \n", "NaN | \n", "NaN | \n", "2006.406443 | \n", "NaN | \n", "NaN | \n", "0.264667 | \n", "0.146652 | \n", "0.077782 | \n", "0.048063 | \n", "0.537441 | \n", "
std | \n", "4791.853933 | \n", "NaN | \n", "NaN | \n", "5.828981 | \n", "NaN | \n", "NaN | \n", "0.816683 | \n", "0.505351 | \n", "0.309291 | \n", "0.188588 | \n", "1.555028 | \n", "
min | \n", "1.000000 | \n", "NaN | \n", "NaN | \n", "1980.000000 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.010000 | \n", "
25% | \n", "4151.250000 | \n", "NaN | \n", "NaN | \n", "2003.000000 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.060000 | \n", "
50% | \n", "8300.500000 | \n", "NaN | \n", "NaN | \n", "2007.000000 | \n", "NaN | \n", "NaN | \n", "0.080000 | \n", "0.020000 | \n", "0.000000 | \n", "0.010000 | \n", "0.170000 | \n", "
75% | \n", "12449.750000 | \n", "NaN | \n", "NaN | \n", "2010.000000 | \n", "NaN | \n", "NaN | \n", "0.240000 | \n", "0.110000 | \n", "0.040000 | \n", "0.040000 | \n", "0.470000 | \n", "
max | \n", "16600.000000 | \n", "NaN | \n", "NaN | \n", "2020.000000 | \n", "NaN | \n", "NaN | \n", "41.490000 | \n", "29.020000 | \n", "10.220000 | \n", "10.570000 | \n", "82.740000 | \n", "