In [None]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from pprint import pprint
# Import API key
import api_keys

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Destination path of the CSV export
output_data_file = "output_data/cities.csv"

# Coordinate bounds as (minimum, maximum) pairs
lat_range = -90, 90
lng_range = -180, 180

In [None]:
# Build the list of candidate cities: sample random coordinates inside the
# configured bounds and map each point to its nearest city via citipy.
lats = np.random.uniform(low=lat_range[0], high=lat_range[1], size=1500)
lngs = np.random.uniform(low=lng_range[0], high=lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# `cities` keeps first-seen order; the companion set makes the uniqueness
# check constant-time instead of rescanning the list for every sample.
cities = []
seen_cities = set()
for lat, lng in lat_lngs:
    city = citipy.nearest_city(lat, lng).city_name
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count (a bare expression would
# not be displayed here because it is not the last statement of the cell).
print(len(cities))

# Base endpoint and unit system used by the weather requests
url = "http://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

In [None]:
# Request the current weather for every candidate city and collect one record
# per successful response; `weather_df` is built once after the loop.
#
# Cities are queried by name only: no country codes are gathered upstream, so
# the country stored in the frame is the one reported by the API response.

# NOTE(review): assumes the local `api_keys` module exposes the key as
# `api_key` — confirm the attribute name.
base_params = {"appid": api_keys.api_key, "units": units}

weather_columns = ["City", "Latitude", "Longitude", "Humidity", "Max Temp",
                   "Cloudiness", "Wind Speed", "Date", "Country"]

records = []
for record_number, city in enumerate(cities, start=1):
    print(f"Processing record {record_number} | {city}")
    try:
        # A timeout keeps one stalled connection from hanging the whole run.
        response = requests.get(url,
                                params={**base_params, "q": city},
                                timeout=10).json()
        # The dict is fully built before it is appended, so a missing key
        # never leaves a partial record behind.
        records.append({"City": response['name'],
                        "Latitude": response['coord']['lat'],
                        "Longitude": response['coord']['lon'],
                        "Humidity": response['main']['humidity'],
                        "Max Temp": response['main']['temp_max'],
                        "Cloudiness": response['clouds']['all'],
                        "Wind Speed": response['wind']['speed'],
                        "Date": response['dt'],
                        "Country": response['sys']['country']})
    except KeyError:
        # Payloads without the weather fields (e.g. an error body for an
        # unknown city) are skipped.
        print('City not found. Skipping..')
    except (requests.RequestException, ValueError) as error:
        # Network failure, timeout, or a body that is not valid JSON.
        print(f"Request failed ({error}). Skipping..")

# Passing `columns` keeps the expected schema even when no record was retrieved.
weather_df = pd.DataFrame(records, columns=weather_columns)

In [None]:
# Persist the collected weather data to the configured CSV path, then show
# the frame's dimensions and a preview of its first rows.
# index=False omits the positional index, which carries no information.
weather_df.to_csv(output_data_file, index=False)
print(weather_df.shape)
weather_df.head()

In [None]:
# Scatter plot of maximum temperature against latitude, saved to latvstemp.png.
latitudes = weather_df['Latitude']
max_temps = weather_df['Max Temp']

plt.scatter(x = latitudes, y = max_temps, edgecolor = 'black')
plt.grid()
plt.xlabel('Latitude')
plt.ylabel('Max Temperature (F)')
plt.title('City Latitude vs. Max Temperature')

# Pad the y-axis by 1/20 of the data range and the x-axis by 5 degrees so the
# outermost points do not sit on the frame.
y_padding = (max_temps.max() - max_temps.min()) / 20
plt.ylim(max_temps.min() - y_padding, max_temps.max() + y_padding)
plt.xlim(latitudes.min() - 5, latitudes.max() + 5)
plt.savefig('latvstemp.png')
plt.show()

In [None]:
# Scatter plot of humidity against latitude, saved to latvshumidity.png.
latitudes = weather_df['Latitude']
humidity_values = weather_df['Humidity']

plt.scatter(x = latitudes, y = humidity_values, edgecolor = 'black')
plt.grid()
plt.xlabel('Latitude')
plt.ylabel('Humidity (%)')
plt.title('City Latitude vs. Humidity')

# Pad the y-axis by 1/20 of the data range and the x-axis by 5 degrees so the
# outermost points do not sit on the frame.
y_padding = (humidity_values.max() - humidity_values.min()) / 20
plt.ylim(humidity_values.min() - y_padding, humidity_values.max() + y_padding)
plt.xlim(latitudes.min() - 5, latitudes.max() + 5)
plt.savefig('latvshumidity.png')
plt.show()

In [None]:
# Scatter plot of cloudiness against latitude, saved to latvscloudiness.png.
latitudes = weather_df['Latitude']
cloudiness_values = weather_df['Cloudiness']

plt.scatter(x = latitudes, y = cloudiness_values, edgecolor = 'black')
plt.grid()
plt.xlabel('Latitude')
plt.ylabel('Cloudiness (%)')
plt.title('City Latitude vs. Cloudiness')

# Pad the y-axis by 1/20 of the data range and the x-axis by 5 degrees so the
# outermost points do not sit on the frame.
y_padding = (cloudiness_values.max() - cloudiness_values.min()) / 20
plt.ylim(cloudiness_values.min() - y_padding, cloudiness_values.max() + y_padding)
plt.xlim(latitudes.min() - 5, latitudes.max() + 5)
plt.savefig('latvscloudiness.png')
plt.show()

In [None]:
# Scatter plot of wind speed against latitude, saved to latvswindspeed.png.
latitudes = weather_df['Latitude']
wind_speeds = weather_df['Wind Speed']

plt.scatter(x = latitudes, y = wind_speeds, edgecolor = 'black')
plt.grid()
plt.xlabel('Latitude')
# Wind speed is requested in imperial units, i.e. miles per hour, not percent.
plt.ylabel('Wind Speed (mph)')
plt.title('City Latitude vs. Wind Speed')

# Pad the y-axis by 1/20 of the data range and the x-axis by 5 degrees so the
# outermost points do not sit on the frame.
y_padding = (wind_speeds.max() - wind_speeds.min()) / 20
plt.ylim(wind_speeds.min() - y_padding, wind_speeds.max() + y_padding)
plt.xlim(latitudes.min() - 5, latitudes.max() + 5)
plt.savefig('latvswindspeed.png')
plt.show()