In [1]:
# import dependencies
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [3]:
# Draw 1,500 random latitudes and 1,500 random longitudes, each sampled
# uniformly from its full valid range.
n_points = 1500
lats = np.random.uniform(-90.0, 90.0, n_points)
lngs = np.random.uniform(-180.0, 180.0, n_points)

# Pair each latitude with the longitude at the same position. zip() is lazy
# and single-use: once it has been iterated it yields nothing more.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x121cea980>

In [4]:
# Materialise the zipped (lat, lng) pairs into a list so they can be
# indexed and iterated more than once.
coordinates = [*lat_lngs]

In [5]:
# import citipy module
from citipy import citipy

In [6]:
# Resolve every random coordinate to the name of its nearest city and keep
# each name once, in first-seen order.
#
# dict.fromkeys() de-duplicates in a single pass while preserving insertion
# order; testing membership against a growing list instead would rescan the
# list for every coordinate, which is quadratic in the number of cities.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name
        for lat, lng in coordinates
    )
)

# show how many unique cities were found
len(cities)

626

In [7]:
# import dependencies, part 2
import requests
from config import weather_api_key
from datetime import datetime

# Base URL for the OpenWeatherMap current-weather endpoint, asking for
# imperial units and carrying the API key. HTTPS is used so that the key in
# the query string is not transmitted in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [8]:
# Weather records collected so far: one dict per city the API returned data for.
city_data = []

# Upper bound (in seconds) on each HTTP request, so that a single stalled
# connection cannot hang the whole retrieval loop.
REQUEST_TIMEOUT_SECONDS = 10

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Counters used only by the progress log: records are numbered from 1
# within each set, and a new set starts every 50 cities.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes (never before the
    # very first city, hence the i >= 50 guard).
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    record_count += 1

    # Run an API request for this city.
    try:
        # Passing the city through `params` lets requests URL-encode it
        # (spaces and any other special characters) and append it to the
        # query string already present in `url`.
        city_weather = requests.get(
            url,
            params={"q": city},
            timeout=REQUEST_TIMEOUT_SECONDS,
        ).json()

        # Parse out the needed data. A response without these keys (for
        # example an error payload) raises KeyError and is skipped below.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        # Convert the Unix timestamp to a "YYYY-MM-DD HH:MM:SS" UTC string.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')

        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # Skip the city on network failures, timeouts, undecodable responses or
    # payloads missing the expected fields. Only these are caught (rather
    # than a bare `except:`) so that KeyboardInterrupt still stops the cell
    # and genuine programming errors are not silently swallowed.
    except (requests.exceptions.RequestException, KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | albany
Processing Record 2 of Set 1 | saleaula
City not found. Skipping...
Processing Record 3 of Set 1 | lompoc
Processing Record 4 of Set 1 | avarua
Processing Record 5 of Set 1 | boyolangu
Processing Record 6 of Set 1 | laurel
Processing Record 7 of Set 1 | tuktoyaktuk
Processing Record 8 of Set 1 | kapaa
Processing Record 9 of Set 1 | russell
Processing Record 10 of Set 1 | punta arenas
Processing Record 11 of Set 1 | cape town
Processing Record 12 of Set 1 | tiksi
Processing Record 13 of Set 1 | luderitz
Processing Record 14 of Set 1 | pitimbu
Processing Record 15 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 16 of Set 1 | mooresville
Processing Record 17 of Set 1 | mecca
Processing Record 18 of Set 1 | samarai
Processing Record 19 of Set 1 | guerrero negro
Processing Record 20 of Set 1 | ulladulla
Processing Record 21 of Set 1 | klaksvik
Processing Record 22 of Set 1 | 

Processing Record 36 of Set 4 | cockburn town
Processing Record 37 of Set 4 | humaita
Processing Record 38 of Set 4 | mata grande
Processing Record 39 of Set 4 | penzance
Processing Record 40 of Set 4 | mayumba
Processing Record 41 of Set 4 | goure
Processing Record 42 of Set 4 | higuey
City not found. Skipping...
Processing Record 43 of Set 4 | mahebourg
Processing Record 44 of Set 4 | morondava
Processing Record 45 of Set 4 | norman wells
Processing Record 46 of Set 4 | arman
Processing Record 47 of Set 4 | beni mazar
Processing Record 48 of Set 4 | coihaique
Processing Record 49 of Set 4 | leh
Processing Record 50 of Set 4 | norfolk
Processing Record 1 of Set 5 | burnie
Processing Record 2 of Set 5 | inhambane
Processing Record 3 of Set 5 | nikolskoye
Processing Record 4 of Set 5 | ingham
Processing Record 5 of Set 5 | bongandanga
Processing Record 6 of Set 5 | matamoros
Processing Record 7 of Set 5 | yulara
Processing Record 8 of Set 5 | mount hagen
Processing Record 9 of Set 5 | s

Processing Record 24 of Set 8 | chara
Processing Record 25 of Set 8 | jizan
Processing Record 26 of Set 8 | pangkalanbuun
Processing Record 27 of Set 8 | port blair
Processing Record 28 of Set 8 | butaritari
Processing Record 29 of Set 8 | puerto suarez
Processing Record 30 of Set 8 | rio bueno
Processing Record 31 of Set 8 | jumla
Processing Record 32 of Set 8 | bulawayo
Processing Record 33 of Set 8 | obo
Processing Record 34 of Set 8 | saint-jean-de-maurienne
Processing Record 35 of Set 8 | buta
Processing Record 36 of Set 8 | vila franca do campo
Processing Record 37 of Set 8 | la ronge
Processing Record 38 of Set 8 | kachug
Processing Record 39 of Set 8 | mahibadhoo
Processing Record 40 of Set 8 | san antonio
Processing Record 41 of Set 8 | havelock
Processing Record 42 of Set 8 | buarcos
Processing Record 43 of Set 8 | ennis
Processing Record 44 of Set 8 | jalu
Processing Record 45 of Set 8 | alice springs
Processing Record 46 of Set 8 | sinnamary
Processing Record 47 of Set 8 | 

Processing Record 11 of Set 12 | krasnyy chikoy
Processing Record 12 of Set 12 | hami
Processing Record 13 of Set 12 | sao jose da coroa grande
Processing Record 14 of Set 12 | hay river
Processing Record 15 of Set 12 | landsmeer
Processing Record 16 of Set 12 | hambantota
Processing Record 17 of Set 12 | port macquarie
Processing Record 18 of Set 12 | santiago del estero
Processing Record 19 of Set 12 | chapais
Processing Record 20 of Set 12 | parana
Processing Record 21 of Set 12 | medford
Processing Record 22 of Set 12 | naze
Processing Record 23 of Set 12 | uarini
Processing Record 24 of Set 12 | temaraia
City not found. Skipping...
Processing Record 25 of Set 12 | kantang
Processing Record 26 of Set 12 | waitati
Processing Record 27 of Set 12 | agbor
Processing Record 28 of Set 12 | muros
Processing Record 29 of Set 12 | vestmannaeyjar
Processing Record 30 of Set 12 | nena
Processing Record 31 of Set 12 | merauke
Processing Record 32 of Set 12 | vostok
Processing Record 33 of Set 

In [9]:
# Build a DataFrame with one row per collected city record, then preview
# the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.iloc[:10]

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Albany,42.6001,-73.9662,32.0,29,99,1.01,US,2021-03-16 23:14:45
1,Lompoc,34.6391,-120.4579,55.4,62,75,18.41,US,2021-03-16 23:15:07
2,Avarua,-21.2078,-159.775,84.2,74,75,13.8,CK,2021-03-16 23:15:25
3,Boyolangu,-8.1181,111.8935,74.71,89,66,1.32,ID,2021-03-16 23:15:26
4,Laurel,39.0993,-76.8483,43.0,75,90,5.75,US,2021-03-16 23:15:26
5,Tuktoyaktuk,69.4541,-133.0374,-13.0,77,20,3.44,CA,2021-03-16 23:15:21
6,Kapaa,22.0752,-159.319,73.4,78,90,24.16,US,2021-03-16 23:10:35
7,Russell,32.3502,-85.1999,66.99,88,90,6.91,US,2021-03-16 23:15:27
8,Punta Arenas,-53.15,-70.9167,48.2,71,0,43.73,CL,2021-03-16 23:15:09
9,Cape Town,-33.9258,18.4232,63.0,77,0,14.97,ZA,2021-03-16 23:15:28


In [12]:
# Rearrange the columns: identifying fields first, then the coordinates,
# then the weather measurements. Preview the first ten rows afterwards.
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df[new_column_order]
city_data_df.iloc[:10]

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Albany,US,2021-03-16 23:14:45,42.6001,-73.9662,32.0,29,99,1.01
1,Lompoc,US,2021-03-16 23:15:07,34.6391,-120.4579,55.4,62,75,18.41
2,Avarua,CK,2021-03-16 23:15:25,-21.2078,-159.775,84.2,74,75,13.8
3,Boyolangu,ID,2021-03-16 23:15:26,-8.1181,111.8935,74.71,89,66,1.32
4,Laurel,US,2021-03-16 23:15:26,39.0993,-76.8483,43.0,75,90,5.75
5,Tuktoyaktuk,CA,2021-03-16 23:15:21,69.4541,-133.0374,-13.0,77,20,3.44
6,Kapaa,US,2021-03-16 23:10:35,22.0752,-159.319,73.4,78,90,24.16
7,Russell,US,2021-03-16 23:15:27,32.3502,-85.1999,66.99,88,90,6.91
8,Punta Arenas,CL,2021-03-16 23:15:09,-53.15,-70.9167,48.2,71,0,43.73
9,Cape Town,ZA,2021-03-16 23:15:28,-33.9258,18.4232,63.0,77,0,14.97


In [13]:
# Destination of the exported CSV, relative to the notebook's working directory.
output_data_file = "weather_data/cities.csv"

# to_csv() does not create missing directories, so make sure the target
# folder exists first; otherwise the export fails on a fresh checkout after
# all the API requests have already been made.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)

# Export the city data to CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")