Python2018/labs06/tasks.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-

"""
1. Zaimportuj bibliotekę pandas jako pd.
"""

from pathlib import Path

import pandas as pd

"""
2. Wczytaj zbiór danych `311.csv` do zmiennej data.
"""

# Load the 311 dataset from the CSV that sits next to this script, instead of
# a machine-specific absolute path, so the script runs from any checkout.
# low_memory=False makes pandas parse the file in a single pass, which avoids
# mixed-dtype inference on columns (see the pandas read_csv documentation).
data = pd.read_csv(Path(__file__).resolve().parent / "311.csv", low_memory=False)


"""
3. Wyświetl 5 pierwszych wierszy z data.
"""

# print(data.head())


"""
4. Wyświetl nazwy kolumn.
"""

# print(data.info())
#print(data.columns)

"""
5. Wyświetl ile nasz zbiór danych ma kolumn i wierszy.

"""
#shape = data.shape
#rows = shape[0]
#cols = shape[1]

#print(rows, cols)

"""
6. Wyświetl kolumnę 'City' z powyższego zbioru danych.
"""

#print(data['City'])

"""
7. Wyświetl jakie wartości przyjmuje kolumna 'City'.

"""
#print(data.City.unique())

"""
8. Wyświetl tabelę rozstawną kolumny City.
"""
#print(data.City.value_counts())

"""
9. Wyświetl tylko pierwsze 4 wiersze z wcześniejszego polecenia.
"""
#print(data.City.value_counts().head(4))

"""
10. Wyświetl, w ilu przypadkach kolumna City zawiera NaN.
"""

#print(data['City'].isnull().sum())


"""
11. Wyświetl data.info()
"""
#print(data.info())
"""
12. Wyświetl tylko kolumny Borough i Agency i tylko 5 ostatnich linii.
"""

#print(data[['Borough', 'Agency']].tail(5))

"""
13. Wyświetl tylko te dane, dla których wartość z kolumny Agency jest równa
NYPD. Zlicz ile jest takich przykładów.

"""
#print(data[data['Agency'] == 'NYPD'])
#print(len(data[data['Agency'] == 'NYPD']))

"""
14. Wyświetl wartość minimalną i maksymalną z kolumny Longitude.
"""
#wartosc = data['Longitude']
#print(wartosc.max())
#print(wartosc.min())
"""
15. Dodaj kolumnę diff, która powstanie przez sumowanie kolumn Longitude i Latitude.
"""
# Task 15: add a 'diff' column holding the element-wise sum of the
# 'Longitude' and 'Latitude' columns (a sum, despite the column's name),
# then print the new column.
longitude = data['Longitude']
latitude = data['Latitude']
data['diff'] = longitude.add(latitude)
print(data['diff'])
"""
16. Wyświetl tabelę rozstawną dla kolumny 'Descriptor', dla której Agency jest
równe NYPD.
"""

# Task 16: frequency table of 'Descriptor' over the rows whose 'Agency'
# column equals 'NYPD'.
p = data[data['Agency'] == 'NYPD']
# A bare expression statement shows nothing when the file is run as a script,
# so the counts are printed explicitly to actually display the table.
print(p.Descriptor.value_counts())
add tasks.py 2018-06-03 08:10:07 +02:00			`#!/usr/bin/env python3`
			`# -- coding: utf-8 --`

			`"""`
			`1. Zaimportuj bibliotkę pandas jako pd.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`import pandas as pd`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
Add 311 2018-06-03 09:52:00 +02:00			2. Wczytaj zbiór danych `311.csv` do zniennej data.
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`

tasks 2018-06-03 11:22:04 +02:00			`data = pd.read_csv("J:/PycharmProjects/Python2018/labs06/311.csv", low_memory = False)`

add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`3. Wyświetl 5 pierwszych wierszy z data.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`# print(data.head())`

add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`4. Wyświetl nazwy kolumn.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`# print(data.info())`
			`#print(data.columns)`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`5. Wyświetl ile nasz zbiór danych ma kolumn i wierszy.`
tasks 2018-06-03 11:22:04 +02:00
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#shape = data.shape`
			`#rows = shape[0]`
			`#cols = shape[1]`
add tasks.py 2018-06-03 08:10:07 +02:00
tasks 2018-06-03 11:22:04 +02:00			`#print(rows, cols)`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`6. Wyświetl kolumnę 'City' z powyższego zbioru danych.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`#print(data['City'])`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`7. Wyświetl jakie wartoścu przyjmuje kolumna 'City'.`
tasks 2018-06-03 11:22:04 +02:00
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#print(data.City.unique())`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`8. Wyświetl tabelę rozstawną kolumny City.`
			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#print(data.City.value_counts())`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`9. Wyświetl tylko pierwsze 4 wiersze z wcześniejszego polecenia.`
			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#print(data.City.value_counts().head(4))`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`10. Wyświetl, w ilu przypadkach kolumna City zawiera NaN.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`#print(data[data['City'] == 'isnull'])`
add tasks.py 2018-06-03 08:10:07 +02:00

			`"""`
			`11. Wyświetl data.info()`
			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#print(data.info())`
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
			`12. Wyświetl tylko kolumny Borough i Agency i tylko 5 ostatnich linii.`
			`"""`

tasks 2018-06-03 11:22:04 +02:00			`#print(data[['Borough', 'Agency']].tail(5))`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`13. Wyświetl tylko te dane, dla których wartość z kolumny Agency jest równa`
			`NYPD. Zlicz ile jest takich przykładów.`
tasks 2018-06-03 11:22:04 +02:00
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#print(data[data['Agency'] == 'NYPD'])`
add tasks.py 2018-06-03 08:10:07 +02:00
			`"""`
			`14. Wyświetl wartość minimalną i maksymalną z kolumny Longitude.`
			`"""`
tasks 2018-06-03 11:22:04 +02:00			`#wartosc = data['Longitude']`
			`#print(wartosc.max())`
			`#print(wartosc.min())`
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
			`15. Dodaj kolumne diff, która powstanie przez sumowanie kolumn Longitude i Latitude.`
			`"""`
tasks 2018-06-03 11:22:04 +02:00			`x=data['Longitude']`
			`y=data['Latitude']`
			`data['diff'] = x+y`
			`print(data['diff'])`
add tasks.py 2018-06-03 08:10:07 +02:00			`"""`
			`16. Wyświetl tablę rozstawną dla kolumny 'Descriptor', dla której Agency jest`
			`równe NYPD.`
			`"""`
tasks 2018-06-03 11:22:04 +02:00
			`p = data[data['Agency'] == 'NYPD']`
			`p.Descriptor.value_counts()`