In [1]:
# Dependencies and Setup
import os
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests

# Import API key
# Prefer the OPENWEATHER_API_KEY environment variable so the credential does not
# have to live in the notebook. The literal is kept only as a fallback so existing
# runs keep working; it has been stored in plain text here, so it should be
# rotated and the fallback removed.
api_key = os.environ.get("OPENWEATHER_API_KEY", "39042e07c1158e77a43c5d806d2b6125")

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Path of the output CSV file (not referenced by the other visible cells)
output_data_file = "output_data/cities.csv"

# (min, max) bounds for latitude and longitude
lat_range, lng_range = (-90, 90), (-180, 180)

In [2]:
# Number of random coordinate pairs to draw. Several pairs can resolve to the
# same nearest city, so the number of unique cities is usually smaller.
sample_size = 1500

# Create a set of random lat and lng combinations inside the configured bounds
lats = np.random.uniform(low=lat_range[0], high=lat_range[1], size=sample_size)
lngs = np.random.uniform(low=lng_range[0], high=lng_range[1], size=sample_size)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination.
# `cities` keeps first-seen order; `seen_cities` makes the uniqueness check a
# constant-time set lookup instead of a scan of the growing list.
cities = []
seen_cities = set()
for sample_lat, sample_lng in lat_lngs:
    city = citipy.nearest_city(sample_lat, sample_lng).city_name

    # If the city is unique, then add it to our cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

604

In [3]:
# Base endpoint for OpenWeatherMap current-weather lookups. HTTPS is used because
# the API key is sent as a query-string parameter and would otherwise travel in
# clear text.
url = "https://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

# Query prefix carrying the API key and units; it ends with "q=" so that a city
# name can be appended directly.
query_url = f"{url}appid={api_key}&units={units}&q="

In [None]:
# Column-wise accumulators: every successfully retrieved city appends exactly one
# value to each list, so index i across all lists describes the same city.
city_name = []
country = []
date = []
lat = []
lng = []
max_temp = []
humidity = []
cloudiness = []
wind_speed = []

# Progress counters used only for the log lines: `record` counts 1-50 inside a
# set, `set_starter` is the current set number.
record = 0
set_starter = 1

# Seconds to wait on a single request before treating it as failed, so one
# stalled connection cannot hang the whole retrieval.
request_timeout = 10

print("Beginning Data Retrieval")

print("--------------------------------")

for city in cities:

    try:
        # Pass the query as `params` so requests URL-encodes the city name.
        response = requests.get(
            url,
            params={"appid": api_key, "units": units, "q": city},
            timeout=request_timeout,
        ).json()

        # Read every field BEFORE touching the lists. If any key is missing the
        # lookup raises here and nothing is appended, so the lists can never end
        # up with different lengths.
        city_record = response["name"]
        city_country = response["sys"]["country"]
        city_date = response["dt"]
        city_lat = response["coord"]["lat"]
        city_lng = response["coord"]["lon"]
        city_max_temp = response["main"]["temp_max"]
        city_humidity = response["main"]["humidity"]
        city_cloudiness = response["clouds"]["all"]
        city_wind_speed = response["wind"]["speed"]
    except (requests.exceptions.RequestException, ValueError, KeyError, TypeError):
        # Network failure, non-JSON body, or a payload without the weather fields
        # (e.g. an error response). Only these are caught, so KeyboardInterrupt
        # still stops the loop.
        print("City not found. Skipping...")
        continue

    city_name.append(city_record)
    country.append(city_country)
    date.append(city_date)
    lat.append(city_lat)
    lng.append(city_lng)
    max_temp.append(city_max_temp)
    humidity.append(city_humidity)
    cloudiness.append(city_cloudiness)
    wind_speed.append(city_wind_speed)

    # After the 50th record of a set, start a new set and restart numbering at 1.
    if record > 49:
        record = 1
        set_starter += 1
    else:
        record += 1

    print(f"Processing Record {record} of Set {set_starter} | {city_record}")

    # Pause after each successful lookup -- presumably to stay under the API's
    # per-minute rate limit; confirm against the plan in use.
    time.sleep(1.02)

print("-------------------------------")
print("Data Retrieval Complete")
print("-------------------------------")

Beginning Data Retrieval
--------------------------------
Processing Record 1 of Set 1 | Rikitea
Processing Record 2 of Set 1 | Albany
Processing Record 3 of Set 1 | New Norfolk
City not found. Skipping...
Processing Record 4 of Set 1 | Te Anau
Processing Record 5 of Set 1 | Dunedin
Processing Record 6 of Set 1 | Mataura
Processing Record 7 of Set 1 | Kupang
Processing Record 8 of Set 1 | Hilo
Processing Record 9 of Set 1 | Hermanus
Processing Record 10 of Set 1 | East London
City not found. Skipping...
Processing Record 11 of Set 1 | Ushuaia
City not found. Skipping...
Processing Record 12 of Set 1 | Hithadhoo
Processing Record 13 of Set 1 | Hobart
City not found. Skipping...
Processing Record 14 of Set 1 | Atuona
City not found. Skipping...
Processing Record 15 of Set 1 | Cavalcante
Processing Record 16 of Set 1 | Beringovskiy
Processing Record 17 of Set 1 | Jiayuguan
City not found. Skipping...
Processing Record 18 of Set 1 | Pevek
Processing Record 19 of Set 1 | Coquimbo
Processing

Processing Record 29 of Set 4 | Kununurra
City not found. Skipping...
City not found. Skipping...
City not found. Skipping...
Processing Record 30 of Set 4 | Kodiak
Processing Record 31 of Set 4 | Cabo San Lucas
Processing Record 32 of Set 4 | Sistranda
Processing Record 33 of Set 4 | Podlesnoye
Processing Record 34 of Set 4 | Upernavik
Processing Record 35 of Set 4 | Ialibu
Processing Record 36 of Set 4 | Dunmore East
Processing Record 37 of Set 4 | Ixtapa
Processing Record 38 of Set 4 | Morant Bay
City not found. Skipping...
Processing Record 39 of Set 4 | San Vicente
Processing Record 40 of Set 4 | Chuy
Processing Record 41 of Set 4 | Quang Ngai
Processing Record 42 of Set 4 | Jinka
Processing Record 43 of Set 4 | Varhaug
Processing Record 44 of Set 4 | Cherskiy
Processing Record 45 of Set 4 | Kurchum
Processing Record 46 of Set 4 | Mahanoro
Processing Record 47 of Set 4 | Klaksvik
Processing Record 48 of Set 4 | Harnosand
Processing Record 49 of Set 4 | Komsomolskiy
Processing Reco

In [None]:
# Convert raw data to a column-name -> values mapping for the DataFrame.
# The label order below fixes the column order of the resulting table.
column_labels = [
    "City",
    "Cloudiness",
    "Country",
    "Date",
    "Humidity",
    "Lat",
    "Lng",
    "Max Temp",
    "Wind Speed",
]
column_values = [
    city_name,
    cloudiness,
    country,
    date,
    humidity,
    lat,
    lng,
    max_temp,
    wind_speed,
]

weather_table = dict(zip(column_labels, column_values))


In [None]:
# Build the table from the column mapping and preview its first five rows
weather_df = pd.DataFrame(data=weather_table)
weather_df.head(n=5)

In [None]:
# Non-null value count for each column
weather_df.count(axis=0)

In [None]:
# Export the collected weather data. to_csv does not create missing folders, so
# make sure the target directory exists first (needed on a fresh checkout).
weather_csv_path = "output/weather_df.csv"
os.makedirs(os.path.dirname(weather_csv_path), exist_ok=True)
weather_df.to_csv(weather_csv_path, index=False, header=True)

In [None]:
#Latitude vs. Temperature Plot
plt.scatter(weather_df["Lat"], weather_df["Max Temp"], edgecolors="black",
           facecolors="royalblue")
# NOTE(review): the date in the title is hard-coded; update it when the data is re-fetched.
plt.title("City Latitude vs. Max Temperature (08/24/19)")
plt.xlabel("Latitude")
plt.ylabel("Max Temperature (F)")
# Enable the grid BEFORE saving so the PNG matches what is shown on screen.
plt.grid(True)
# savefig does not create missing folders.
os.makedirs("figures", exist_ok=True)
plt.savefig("figures/fig1.png")
plt.show()


In [None]:
#Latitude vs. Humidity
plt.scatter(weather_df["Lat"], weather_df["Humidity"], edgecolors="black",
           facecolors="royalblue")
# NOTE(review): the date in the title is hard-coded; update it when the data is re-fetched.
plt.title("City Latitude vs. Humidity (08/24/19)")
plt.xlabel("Latitude")
plt.ylabel("Humidity (%)")
# Enable the grid BEFORE saving so the PNG matches what is shown on screen.
plt.grid(True)
# savefig does not create missing folders.
os.makedirs("figures", exist_ok=True)
plt.savefig("figures/fig2.png")
plt.show()

In [None]:
#Latitude vs. Cloudiness
plt.scatter(weather_df["Lat"], weather_df["Cloudiness"], edgecolors="black",
           facecolors="royalblue")
# NOTE(review): the date in the title is hard-coded; update it when the data is re-fetched.
plt.title("City Latitude vs. Cloudiness (08/24/19)")
plt.xlabel("Latitude")
plt.ylabel("Cloudiness (%)")
# Enable the grid BEFORE saving so the PNG matches what is shown on screen.
plt.grid(True)
# savefig does not create missing folders.
os.makedirs("figures", exist_ok=True)
plt.savefig("figures/fig3.png")
plt.show()

In [None]:
#Latitude vs. Wind Speed
plt.scatter(weather_df["Lat"], weather_df["Wind Speed"], edgecolors="black",
           facecolors="royalblue")
# NOTE(review): the date in the title is hard-coded; update it when the data is re-fetched.
plt.title("City Latitude vs. Wind Speed (08/24/19)")
plt.xlabel("Latitude")
plt.ylabel("Wind Speed (mph)")
# Enable the grid BEFORE saving so the PNG matches what is shown on screen.
plt.grid(True)
# savefig does not create missing folders.
os.makedirs("figures", exist_ok=True)
plt.savefig("figures/fig4.png")
plt.show()