# Create Latitude and Longitude Combinations

In [1]:
# Import dependencies

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [2]:
# Create a set of random latitude and longitude combinations
# pack the latitudes (lats) and longitudes (lngs) as pairs by zipping them (lat_lngs) with the zip() function
# The zip object packs each pair of lats and lngs having the same index in their respective array into a tuple

lats = np.random.uniform(-90,90, size=1500)
lngs = np.random.uniform(-180,180, size=1500)
lat_lngs = zip(lats, lngs)

# When we run this cell, the output is a zip object in memory
lat_lngs

<zip at 0x7fa72b79a640>

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)
coordinates

[(-34.56885488708798, -97.55731610799997),
 (9.282483833763791, 72.85456149819353),
 (-84.75479765106553, 31.363612711703553),
 (4.394298253623745, -56.130349145961674),
 (12.490926740116464, -8.752259886445785),
 (31.275049817901177, -114.01073785812741),
 (54.37746112861828, 52.2808413245117),
 (-45.77172590946024, 131.8292100911006),
 (-81.63028149052985, -42.75062522500187),
 (-15.357622510737741, -90.04603138370938),
 (-9.058311180332893, -129.74629381948577),
 (34.53224068820427, 93.9970235463831),
 (29.62043719533827, -59.781594288287536),
 (50.9293778153548, 144.39033763834118),
 (-87.06896396940519, -127.12461547796272),
 (40.089594039604236, -84.25500136622063),
 (-6.73594356330257, -17.76496510801465),
 (49.434592824025486, 130.44044023494217),
 (81.1532398013575, 55.56482846365881),
 (65.90343624920908, 14.369314697350546),
 (-82.92698846364272, -176.49607414694322),
 (81.38847200237643, 159.5816226752894),
 (-85.2396137158778, -129.59748274000773),
 (-1.6830784065737276, -

In [4]:
# You can only unzip a zipped tuple once before it is removed from the computer’s memory. 
# Make sure you unzip the latitudes and longitudes into the coordinates list before moving on.

# Work with citipy

In [5]:
from citipy import citipy

In [6]:
# Create a list for holding the cities.
cities = []

# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)

        # Print the city count to confirm sufficient count.
len(cities)

646

# Request API Weather Data for All Cities

In [7]:
# Import the requests library.
import requests

requests.__version__

'2.23.0'

In [10]:
# Import the API key.
from config import api_key

# Import the datetime module from the datetime library.
from datetime import datetime

In [9]:
# Starting URL for Weather Map API Call.
# units=Imperial added to url
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + api_key

In [12]:
# Create an empty list to hold the weather data.
city_data = []

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1


# To reference the city in our code, we need to use the indexing on the cities_list, but this will cause programming
# errors when building the city_url because it adds the index, not the city name, to the city_url. To fix this issue,
# use the enumerate() method as an alternative way to iterate through the list of cities and retrieve both the index
# and the city from the list.

# Loop through all the cities in our list.
for i, city in enumerate(cities):
    
    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")
    
    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    
    # Add 1 to the record count.
    record_count += 1
    
    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Generally, it isn’t good coding practice to add the pass statement to the except block. Ideally, we want to handle
# or catch each error as it happens and do something specific (e.g., add another try block or print out the error).
    
# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | lebu
Processing Record 2 of Set 1 | kavaratti
Processing Record 3 of Set 1 | port elizabeth
Processing Record 4 of Set 1 | brokopondo
Processing Record 5 of Set 1 | kangaba
Processing Record 6 of Set 1 | puerto penasco
Processing Record 7 of Set 1 | shugurovo
Processing Record 8 of Set 1 | port lincoln
Processing Record 9 of Set 1 | ushuaia
Processing Record 10 of Set 1 | huarmey
Processing Record 11 of Set 1 | atuona
Processing Record 12 of Set 1 | lasa
Processing Record 13 of Set 1 | saint george
Processing Record 14 of Set 1 | katangli
Processing Record 15 of Set 1 | rikitea
Processing Record 16 of Set 1 | piqua
Processing Record 17 of Set 1 | georgetown
Processing Record 18 of Set 1 | arkhara
Processing Record 19 of Set 1 | belushya guba
City not found. Skipping...
Processing Record 20 of Set 1 | mo i rana
Processing Record 21 of Set 1 | vaini
Processing Record 22 of Set 1 | cherskiy
Processi

Processing Record 38 of Set 4 | shahreza
Processing Record 39 of Set 4 | beringovskiy
Processing Record 40 of Set 4 | kristiansund
Processing Record 41 of Set 4 | valdivia
Processing Record 42 of Set 4 | fort wellington
Processing Record 43 of Set 4 | am timan
Processing Record 44 of Set 4 | lima
Processing Record 45 of Set 4 | izhma
Processing Record 46 of Set 4 | magadan
Processing Record 47 of Set 4 | socorro
Processing Record 48 of Set 4 | chuy
Processing Record 49 of Set 4 | tuatapere
Processing Record 50 of Set 4 | padang
Processing Record 1 of Set 5 | cidreira
Processing Record 2 of Set 5 | alofi
Processing Record 3 of Set 5 | vaitupu
City not found. Skipping...
Processing Record 4 of Set 5 | kloulklubed
Processing Record 5 of Set 5 | aklavik
Processing Record 6 of Set 5 | zalantun
Processing Record 7 of Set 5 | katsuura
Processing Record 8 of Set 5 | mahebourg
Processing Record 9 of Set 5 | monrovia
Processing Record 10 of Set 5 | yulara
Processing Record 11 of Set 5 | sentyabr

Processing Record 29 of Set 8 | zhanatas
City not found. Skipping...
Processing Record 30 of Set 8 | henties bay
Processing Record 31 of Set 8 | burnie
Processing Record 32 of Set 8 | chunskiy
Processing Record 33 of Set 8 | homestead
Processing Record 34 of Set 8 | saint-pierre
Processing Record 35 of Set 8 | zadar
Processing Record 36 of Set 8 | upington
Processing Record 37 of Set 8 | harper
Processing Record 38 of Set 8 | yatou
Processing Record 39 of Set 8 | geraldton
Processing Record 40 of Set 8 | terney
Processing Record 41 of Set 8 | matagami
Processing Record 42 of Set 8 | salinas
Processing Record 43 of Set 8 | belyy yar
Processing Record 44 of Set 8 | verkhnevilyuysk
Processing Record 45 of Set 8 | loiza
Processing Record 46 of Set 8 | el sauzal
Processing Record 47 of Set 8 | ostersund
Processing Record 48 of Set 8 | liku
Processing Record 49 of Set 8 | ust-kuyga
Processing Record 50 of Set 8 | codrington
Processing Record 1 of Set 9 | castanos
Processing Record 2 of Set 9

Processing Record 16 of Set 12 | pangai
Processing Record 17 of Set 12 | manises
Processing Record 18 of Set 12 | lincoln
Processing Record 19 of Set 12 | mareeba
Processing Record 20 of Set 12 | kortkeros
Processing Record 21 of Set 12 | kalemie
Processing Record 22 of Set 12 | clearwater
Processing Record 23 of Set 12 | ilo
Processing Record 24 of Set 12 | ovsyanka
Processing Record 25 of Set 12 | sompeta
Processing Record 26 of Set 12 | halalo
City not found. Skipping...
Processing Record 27 of Set 12 | ukmerge
Processing Record 28 of Set 12 | bhag
Processing Record 29 of Set 12 | pallasovka
Processing Record 30 of Set 12 | zarubino
Processing Record 31 of Set 12 | desaguadero
Processing Record 32 of Set 12 | guspini
Processing Record 33 of Set 12 | umzimvubu
City not found. Skipping...
Processing Record 34 of Set 12 | chateaubelair
Processing Record 35 of Set 12 | college
Processing Record 36 of Set 12 | mineiros
Processing Record 37 of Set 12 | chernyshevskiy
Processing Record 38 

In [14]:
# Count the number of cities in city_data
len(city_data)

595

# Convert the Array of Dictionaries to Other Formats & Reorder Columns

In [15]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Lebu,-37.62,-73.65,52.99,83,64,12.86,CL,2020-06-17 21:15:40
1,Kavaratti,10.57,72.64,84.56,77,100,22.88,IN,2020-06-17 21:16:53
2,Port Elizabeth,-33.92,25.57,50.0,93,0,2.24,ZA,2020-06-17 21:15:00
3,Brokopondo,4.75,-55.17,80.83,82,49,8.08,SR,2020-06-17 21:16:55
4,Kangaba,11.93,-8.42,86.25,42,88,9.4,ML,2020-06-17 21:16:56
5,Puerto Penasco,31.32,-113.53,82.0,63,0,18.01,MX,2020-06-17 21:16:57
6,Shugurovo,54.51,52.13,60.85,91,12,6.11,RU,2020-06-17 21:16:57
7,Port Lincoln,-34.73,135.87,55.8,63,8,20.11,AU,2020-06-17 21:16:58
8,Ushuaia,-54.8,-68.3,37.4,74,40,3.36,AR,2020-06-17 21:14:13
9,Huarmey,-10.07,-78.15,69.06,68,0,12.82,PE,2020-06-17 21:16:59


In [18]:
# Assign new column order to a variable
new_column_order = ["City","Country","Date","Lat","Lng","Max Temp","Humidity","Cloudiness","Wind Speed",]

In [19]:
#Assign new column order to df
city_data_df = city_data_df[new_column_order]

In [20]:
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Lebu,CL,2020-06-17 21:15:40,-37.62,-73.65,52.99,83,64,12.86
1,Kavaratti,IN,2020-06-17 21:16:53,10.57,72.64,84.56,77,100,22.88
2,Port Elizabeth,ZA,2020-06-17 21:15:00,-33.92,25.57,50.0,93,0,2.24
3,Brokopondo,SR,2020-06-17 21:16:55,4.75,-55.17,80.83,82,49,8.08
4,Kangaba,ML,2020-06-17 21:16:56,11.93,-8.42,86.25,42,88,9.4
5,Puerto Penasco,MX,2020-06-17 21:16:57,31.32,-113.53,82.0,63,0,18.01
6,Shugurovo,RU,2020-06-17 21:16:57,54.51,52.13,60.85,91,12,6.11
7,Port Lincoln,AU,2020-06-17 21:16:58,-34.73,135.87,55.8,63,8,20.11
8,Ushuaia,AR,2020-06-17 21:14:13,-54.8,-68.3,37.4,74,40,3.36
9,Huarmey,PE,2020-06-17 21:16:59,-10.07,-78.15,69.06,68,0,12.82


In [21]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")