In [None]:
# Dependencies and Setup
import os
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from scipy.stats import linregress

# Import API key
from api_keys import weather_api

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Destination CSV for the collected weather records
output_data_file = 'output_data/cities.csv'

# (min, max) bounds used when sampling random coordinates
lat_range, lng_range = (-90, 90), (-180, 180)



In [None]:
# Unique city names, kept in the order they are first encountered
cities = []

# Sample 1500 random latitudes, then 1500 random longitudes, and pair them up
lats = np.random.uniform(*lat_range, size=1500)
lngs = np.random.uniform(*lng_range, size=1500)
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every coordinate pair, skipping repeats
for lat, lng in lat_lngs:
    city = citipy.nearest_city(lat, lng).city_name
    if city in cities:
        continue
    cities.append(city)

base_url = 'http://api.openweathermap.org/data/2.5/weather?q='
# NOTE: assembled once, so this URL embeds only the city the loop above ended on
query_url = ''.join((base_url, city, '&appid=', weather_api))

# Show how many distinct cities were found to confirm the sample is large enough
len(cities)

In [None]:
# Result columns: each list receives exactly one value per successfully
# retrieved city, so they always stay the same length.
cloudinesses = []
dates = []
humidities = []
lats = []
lngs = []
max_temps = []
wind_speeds = []
countries = []
city_column = []

# Counters used only for the "Record N of Set M" progress log
count_one = 0
set_one = 1

# Current-weather endpoint (https so the API key is not sent in clear text)
weather_endpoint = 'https://api.openweathermap.org/data/2.5/weather'

#Run the API call for each city
print('Beginning Data Retrieval')
print('-----------------------------')

for city in cities:
    try:
        # Build the query per city; `params` also URL-encodes names that
        # contain spaces. units=imperial requests Fahrenheit / mph, which is
        # what the "Max Temperature (F)" plot label expects.
        weather_response = requests.get(
            weather_endpoint,
            params={'q': city, 'units': 'imperial', 'appid': weather_api},
            timeout=10,
        )
        weather_json = weather_response.json()
    except (requests.RequestException, ValueError) as error:
        # Network failure, timeout, or a body that is not valid JSON
        print(f'Request failed for {city} ({error}). Skipping...')
        continue

    try:
        # Read every field BEFORE appending anything: if a key is missing we
        # skip the whole city instead of leaving the lists misaligned.
        cloudiness = weather_json['clouds']['all']
        country = weather_json['sys']['country']
        date = weather_json['dt']
        humidity = weather_json['main']['humidity']
        lat = weather_json['coord']['lat']
        lng = weather_json['coord']['lon']
        max_temp = weather_json['main']['temp_max']
        wind_speed = weather_json['wind']['speed']
    except KeyError:
        # Error payloads (e.g. unknown city) do not carry the weather fields
        print('City not found. Skipping...')
        continue

    cloudinesses.append(cloudiness)
    countries.append(country)
    dates.append(date)
    humidities.append(humidity)
    lats.append(lat)
    lngs.append(lng)
    max_temps.append(max_temp)
    wind_speeds.append(wind_speed)
    city_column.append(city)

    # Advance the progress counters; a new set starts once the record
    # number has gone past 48.
    if count_one > 48:
        count_one = 1
        set_one += 1
    else:
        count_one += 1
    print(f"Processing Record {count_one} of Set {set_one} | {city}")

print('------------------------------')
print('Data Retrieval Complete')
print('------------------------------')

In [None]:
# Pair each output column name with the list collected for it, then build
# the DataFrame from that mapping (column order follows the name list).
column_names = ["City", "Cloudiness", "Country", "Date", "Humidity",
                "Lat", "Lng", "Max Temp", "Wind Speed"]
column_values = [city_column, cloudinesses, countries, dates, humidities,
                 lats, lngs, max_temps, wind_speeds]
weather_dict = dict(zip(column_names, column_values))
weather_df = pd.DataFrame(data=weather_dict)

# Preview the first rows
weather_df.head()

In [None]:
# Write the weather table to CSV. The parent folder is created first because
# to_csv does not create missing directories.
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)
weather_df.to_csv(output_data_file)

In [None]:
# Scatter plot of max temperature against latitude, saved to Figures/fig1.png
os.makedirs("Figures", exist_ok=True)  # savefig does not create the folder
fig, ax = plt.subplots()
ax.scatter(weather_df["Lat"], weather_df["Max Temp"], edgecolors="black", facecolors="blue")
ax.set_title("City Latitude vs. Max Temperature (07/23/2020)")
ax.set_xlabel("Latitude")
ax.set_ylabel("Max Temperature (F)")
# The on/off flag is passed positionally: its keyword was renamed from `b`
# to `visible` in newer Matplotlib, so `b=True` fails on current releases.
ax.grid(True, which="major", axis="both", linestyle="-", color="lightgrey")
fig.savefig("Figures/fig1.png")
plt.show()

In [None]:
# Scatter plot of humidity against latitude, saved to Figures/fig2.png
os.makedirs("Figures", exist_ok=True)  # savefig does not create the folder
fig, ax = plt.subplots()
ax.scatter(weather_df["Lat"], weather_df["Humidity"], edgecolors="black", facecolors="blue")
ax.set_title("City Latitude vs. Humidity (07/23/2020)")
ax.set_xlabel("Latitude")
ax.set_ylabel("Humidity (%)")
ax.set_ylim(15, 105)
# The on/off flag is passed positionally: its keyword was renamed from `b`
# to `visible` in newer Matplotlib, so `b=True` fails on current releases.
ax.grid(True, which="major", axis="both", linestyle="-", color="lightgrey")
fig.savefig("Figures/fig2.png")
plt.show()

In [None]:
# Scatter plot of cloudiness against latitude, saved to Figures/fig3.png.
# Reads from weather_df, the DataFrame the notebook actually defines.
os.makedirs("Figures", exist_ok=True)  # savefig does not create the folder
fig, ax = plt.subplots()
ax.scatter(weather_df["Lat"], weather_df["Cloudiness"], edgecolors="black", facecolors="blue")
ax.set_title("City Latitude vs. Cloudiness (07/23/2020)")
ax.set_xlabel("Latitude")
ax.set_ylabel("Cloudiness (%)")
# The on/off flag is passed positionally: its keyword was renamed from `b`
# to `visible` in newer Matplotlib, so `b=True` fails on current releases.
ax.grid(True, which="major", axis="both", linestyle="-", color="lightgrey")
fig.savefig("Figures/fig3.png")
plt.show()