In [13]:
#Import dependencies
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [14]:
#Draw 1,500 random latitudes (between -90 and 90) and longitudes (between -180 and 180)
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
#Pair each latitude with the longitude found at the same index
lat_lngs = zip(lats, lngs)
lat_lngs

#This zip object packs each pair of lats and lngs that share the same index in their respective arrays into a tuple

<zip at 0x22e811e2048>

In [15]:
#Add the latitudes and longitudes to a list.
#The pairs are built straight from the lats and lngs arrays: the lat_lngs zip object is a
# one-shot iterator, so list(lat_lngs) would return an empty list if this cell were run twice.
coordinates = list(zip(lats, lngs))

In [16]:
#Use the citipy module to determine city based on latitude and longitude
from citipy import citipy

In [17]:
#Create a list for holding the cities (kept in first-seen order)
cities = []
#Companion set used only for fast "have we seen this city?" checks,
# so the membership test does not rescan the whole list for every coordinate
seen_cities = set()

#Identify the nearest city for each latitude and longitude combination
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    #If the city is unique, then we will add it to the cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
#Print the city count to confirm sufficient count
len(cities)

603

## Retrieve City Weather Data

In [18]:
#Import dependencies
from citipy import citipy
import requests
from config import weather_api_key
from datetime import datetime

#Base endpoint for current weather in Imperial units. HTTPS is used so the API key,
# which travels in the query string, is not sent over the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [19]:
#Create an empty list to hold the weather data
city_data = []

#Print the beginning of the logging
print("Beginning Data Retrieval     ")
print("-----------------------------")

#Create counters
record_count = 1
set_count = 1

#Loop through all the cities in our list
for i, city in enumerate(cities):

    #Group cities in sets of 50 for logging purposes:
    # every 50th index (except 0) starts a new set and restarts the record numbering
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    #Create endpoint URL with each city. Blank spaces are replaced with "+" so that
    # the full multi-word city name is sent, not only its first word.
    city_url = url + "&q=" + city.replace(" ","+")
    #Log the record and set numbers and the city
    # (the URL itself is not printed, since it contains the API key)
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    #Add 1 to the record count
    record_count += 1

    #Run an API request for each of the cities
    try:
        #Request and parse the JSON; the timeout (seconds) stops a stalled
        # connection from hanging the whole loop
        city_weather = requests.get(city_url, timeout=10).json()
        #Parse out the needed data
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']
        #Convert the date to ISO standard
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        #Append the city information into city_data list
        city_data.append({'City': city.title(),
                          'Lat': city_lat,
                          'Lng': city_lng,
                          'Max Temp': city_max_temp,
                          'Humidity': city_humidity,
                          'Cloudiness': city_clouds,
                          'Wind Speed': city_wind,
                          'Country': city_country,
                          'Date': city_date})
    #If the request fails, the body is not JSON, or an expected field is missing, skip the city.
    #Only these errors are caught, so a kernel interrupt (KeyboardInterrupt) still stops the loop.
    except (KeyError, ValueError, requests.exceptions.RequestException):
        print("City not found. Skipping...")

#Indicate that the Data Loading is complete
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

### Code Breakdown ###
#Loop over the cities with enumerate() to get both the index and the city name.
#When the index is a multiple of 50 (and at least 50), start a new set and reset the record count.
#Build the endpoint URL for the city, replacing blank spaces with "+".
#Print the record count, set count, and the city being processed, then add 1 to the record count.
#Inside the try block, request the weather for the city and parse the JSON response.
#If there is weather data for the city, the metrics are retrieved.
#The city_data list is appended with a dictionary for that city, where the key value pairs
# are the retrieved metrics.
#The except block prints a message for cities that could not be retrieved, and the loop
# continues with the next city.

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | busselton
Processing Record 2 of Set 1 | qaanaaq
Processing Record 3 of Set 1 | kushima
Processing Record 4 of Set 1 | hermanus
Processing Record 5 of Set 1 | saint george
Processing Record 6 of Set 1 | georgetown
Processing Record 7 of Set 1 | rikitea
Processing Record 8 of Set 1 | bethel
Processing Record 9 of Set 1 | mys shmidta
City not found. Skipping...
Processing Record 10 of Set 1 | guanica
Processing Record 11 of Set 1 | alamos
Processing Record 12 of Set 1 | cayenne
Processing Record 13 of Set 1 | carahue
Processing Record 14 of Set 1 | winslow
Processing Record 15 of Set 1 | lebu
Processing Record 16 of Set 1 | grand gaube
Processing Record 17 of Set 1 | punta arenas
Processing Record 18 of Set 1 | grand river south east
City not found. Skipping...
Processing Record 19 of Set 1 | hobart
Processing Record 20 of Set 1 | mogadishu
Processing Record 21 of Set 1 | kamenskoye
City not found.

Processing Record 39 of Set 4 | araouane
Processing Record 40 of Set 4 | teguldet
Processing Record 41 of Set 4 | isangel
Processing Record 42 of Set 4 | karad
Processing Record 43 of Set 4 | pesca
Processing Record 44 of Set 4 | marcona
City not found. Skipping...
Processing Record 45 of Set 4 | portland
Processing Record 46 of Set 4 | bambous virieux
Processing Record 47 of Set 4 | saint-pierre
Processing Record 48 of Set 4 | ruatoria
City not found. Skipping...
Processing Record 49 of Set 4 | nyurba
Processing Record 50 of Set 4 | faanui
Processing Record 1 of Set 5 | dunedin
Processing Record 2 of Set 5 | padang
Processing Record 3 of Set 5 | douglas
Processing Record 4 of Set 5 | chilca
Processing Record 5 of Set 5 | champagnole
Processing Record 6 of Set 5 | nakusp
Processing Record 7 of Set 5 | chicama
Processing Record 8 of Set 5 | praia da vitoria
Processing Record 9 of Set 5 | dumas
Processing Record 10 of Set 5 | angoche
Processing Record 11 of Set 5 | zyryanka
Processing Re

Processing Record 31 of Set 8 | kieta
Processing Record 32 of Set 8 | kununurra
Processing Record 33 of Set 8 | nanortalik
Processing Record 34 of Set 8 | shar
Processing Record 35 of Set 8 | barcelos
Processing Record 36 of Set 8 | rio grande
Processing Record 37 of Set 8 | lamballe
Processing Record 38 of Set 8 | agua verde
Processing Record 39 of Set 8 | charters towers
Processing Record 40 of Set 8 | port blair
Processing Record 41 of Set 8 | byron bay
Processing Record 42 of Set 8 | san antonio
Processing Record 43 of Set 8 | warqla
City not found. Skipping...
Processing Record 44 of Set 8 | abu samrah
Processing Record 45 of Set 8 | mandalgovi
Processing Record 46 of Set 8 | saint-joseph
Processing Record 47 of Set 8 | varniai
Processing Record 48 of Set 8 | farafangana
Processing Record 49 of Set 8 | thinadhoo
Processing Record 50 of Set 8 | attawapiskat
City not found. Skipping...
Processing Record 1 of Set 9 | wahiawa
Processing Record 2 of Set 9 | kaffrine
Processing Record 3

Processing Record 17 of Set 12 | khorixas
Processing Record 18 of Set 12 | jinji
Processing Record 19 of Set 12 | panvel
Processing Record 20 of Set 12 | muhos
Processing Record 21 of Set 12 | batagay-alyta
Processing Record 22 of Set 12 | dalbandin
Processing Record 23 of Set 12 | serebryansk
Processing Record 24 of Set 12 | erzin
Processing Record 25 of Set 12 | satitoa
City not found. Skipping...
Processing Record 26 of Set 12 | melilla
Processing Record 27 of Set 12 | porto santo
Processing Record 28 of Set 12 | makakilo city
Processing Record 29 of Set 12 | ostersund
Processing Record 30 of Set 12 | vanavara
Processing Record 31 of Set 12 | bansda
City not found. Skipping...
Processing Record 32 of Set 12 | krasnoselkup
Processing Record 33 of Set 12 | debre sina
Processing Record 34 of Set 12 | galiwinku
City not found. Skipping...
Processing Record 35 of Set 12 | amahai
Processing Record 36 of Set 12 | oranjestad
Processing Record 37 of Set 12 | kroderen
City not found. Skipping

In [20]:
#Count the cities whose weather data was appended to city_data
len(city_data)

555

In [21]:
#Build a Pandas data frame with one row per dictionary in city_data
city_data_df = pd.DataFrame(data=city_data)
#Preview the first ten rows
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Busselton,-33.65,115.33,75.99,50,52,3.0,AU,2020-11-19 05:37:59
1,Qaanaaq,77.48,-69.36,27.73,87,100,15.05,GL,2020-11-19 05:37:59
2,Kushima,31.46,131.23,78.8,65,75,19.46,JP,2020-11-19 05:38:00
3,Hermanus,-34.42,19.23,61.0,84,20,3.0,ZA,2020-11-19 05:38:00
4,Saint George,37.1,-113.58,60.8,31,1,11.41,US,2020-11-19 05:38:00
5,Georgetown,5.41,100.34,86.0,79,40,9.17,MY,2020-11-19 05:38:00
6,Rikitea,-23.12,-134.97,70.5,89,100,17.74,PF,2020-11-19 05:33:27
7,Bethel,41.37,-73.41,21.0,79,1,0.92,US,2020-11-19 05:38:01
8,Guanica,17.97,-66.91,75.0,91,11,5.84,PR,2020-11-19 05:38:01
9,Alamos,27.02,-108.93,73.0,63,0,3.49,MX,2020-11-19 05:38:01


In [24]:
#Put the identifying columns (city, country, date) first, followed by the measurements
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
#Select every row with the columns in the new order
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Busselton,AU,2020-11-19 05:37:59,-33.65,115.33,75.99,50,52,3.0
1,Qaanaaq,GL,2020-11-19 05:37:59,77.48,-69.36,27.73,87,100,15.05
2,Kushima,JP,2020-11-19 05:38:00,31.46,131.23,78.8,65,75,19.46
3,Hermanus,ZA,2020-11-19 05:38:00,-34.42,19.23,61.0,84,20,3.0
4,Saint George,US,2020-11-19 05:38:00,37.1,-113.58,60.8,31,1,11.41
5,Georgetown,MY,2020-11-19 05:38:00,5.41,100.34,86.0,79,40,9.17
6,Rikitea,PF,2020-11-19 05:33:27,-23.12,-134.97,70.5,89,100,17.74
7,Bethel,US,2020-11-19 05:38:01,41.37,-73.41,21.0,79,1,0.92
8,Guanica,PR,2020-11-19 05:38:01,17.97,-66.91,75.0,91,11,5.84
9,Alamos,MX,2020-11-19 05:38:01,27.02,-108.93,73.0,63,0,3.49


In [23]:
#Create the output file (CSV)
output_data_file = "weather_data/cities.csv"

#Make sure the destination folder exists first: to_csv does not create missing
# directories, and a failure here would come only after the long retrieval loop
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)

#Export the city_data into a CSV, labelling the index column City_ID
city_data_df.to_csv(output_data_file, index_label='City_ID')