python-scripts/25_ip2geolocation.py

62 lines
1.8 KiB
Python
Raw Normal View History

2015-02-18 19:56:18 +01:00
import csv
import requests
def get_addresses(filename):
"""
Given a CSV file, this function returns a list of lists
where each element (list) in the outer list contains the
row info from the csv file.
"""
all_addresses = []
with open(filename, 'rt') as f:
2015-02-18 19:56:18 +01:00
reader = csv.reader(f)
for row in reader:
all_addresses.append(row)
return all_addresses
def get_geolocation(all_the_ip_address):
"""
Given a list of lists from `get_addresses()`, this function
returns an updated lists of lists containing the geolocation.
"""
print("Getting geo information...")
updated_addresses = []
counter = 1
# update header
header_row = all_the_ip_address.pop(0)
header_row.extend(['Country', 'City'])
# get geolocation
for line in all_the_ip_address:
print("Grabbing geo info for row # {0}".format(counter))
2015-02-18 19:56:18 +01:00
r = requests.get('https://freegeoip.net/json/{0}'.format(line[0]))
line.extend([str(r.json()['country_name']), str(r.json()['city'])])
updated_addresses.append(line)
counter += 1
updated_addresses.insert(0, header_row)
return updated_addresses
def create_csv(updated_address_list):
"""
Given the updated lists of lists from `get_geolocation()`, this function
creates a new CSV.
"""
import sys
if sys.version_info >= (3, 0, 0):
f = open('output.csv', 'w', newline='')
else:
f = open('output.csv', 'wb')
with f:
2015-02-18 19:56:18 +01:00
writer = csv.writer(f)
writer.writerows(updated_address_list)
print("All done!")
2015-02-18 19:56:18 +01:00
if __name__ == '__main__':
csv_file = '25_sample_csv.csv'
all_the_ip_address = get_addresses(csv_file)
updated_address_list = get_geolocation(all_the_ip_address)
create_csv(updated_address_list)