In [4]:
# Dependencies and Setup

# visualizations
import matplotlib.pyplot as plt
import seaborn as sns

#data science - standard library
import pandas as pd
import numpy as np

#requests
import requests
from pprint import pprint
import time

#regression
from scipy.stats import linregress
import statsmodels.api as sm
from sklearn.linear_model import LinearRegression

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Destination CSV that the collected weather table is written to
output_data_file = "Lane_cities.csv"

# (min, max) bounds, in degrees, used when sampling random coordinates
lat_range, lng_range = (-90, 90), (-180, 180)

In [5]:
# Build the list of unique cities nearest to a set of random coordinates.

# Number of random (lat, lng) points to draw
n_samples = 1500

# Create a set of random lat and lng combinations
# NOTE(review): no random seed is set, so the sampled cities differ on every run.
lats = np.random.uniform(lat_range[0], lat_range[1], size=n_samples)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=n_samples)

# Materialise the pairs as a list so lat_lngs is still readable after the
# lookup below (a bare zip object would be exhausted by the first pass).
lat_lngs = list(zip(lats, lngs))

# Identify the nearest city for each lat, lng combination.
# dict.fromkeys drops duplicates with O(1) lookups while keeping first-seen
# order, replacing the quadratic `city not in cities` list scan.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))

# Print the city count to confirm sufficient count
len(cities)

598

In [8]:
# Work with only the first five cities while developing the request loop
cities_sub = cities[:5]
cities_sub

['carnarvon', 'vila velha', 'hithadhoo', 'pangnirtung', 'albany']

In [23]:
# Fetch current weather for each city in cities_sub and collect it in `df`.
#
# One request is made per city. Cities that the API does not know (404), that
# fail at the network level, or whose payload lacks an expected field are
# reported and skipped, so every list below ends up the same length.

# init lists to hold parsed data (one entry per successfully parsed city)
lats = []
longs = []
temps = []
humid = []
windSpeed = []
cloudiness = []
cities_found = []

# Loop-invariant request settings
units = "imperial"
base_url = "https://api.openweathermap.org/data/2.5/weather"
request_timeout = 10  # seconds; without a timeout requests.get can block forever

for city in cities_sub:
    try:
        # Let requests build the query string so names containing spaces or
        # non-ASCII characters are URL-encoded correctly.
        response = requests.get(
            base_url,
            params={"q": city, "units": units, "appid": weather_api_key},
            timeout=request_timeout,
        )
    except requests.exceptions.RequestException as e:
        # Connection errors and timeouts affect only this city, not the run
        print(f"Request failed for city {city}: {e}")
    else:
        if response.status_code == 200:
            try:
                data = response.json()

                # Extract every field before appending anything, so a missing
                # key cannot leave the lists with unequal lengths.
                lat = data["coord"]["lat"]
                lon = data["coord"]["lon"]
                temp = data["main"]["temp"]
                humidity = data["main"]["humidity"]
                speed = data["wind"]["speed"]
                clouds = data["clouds"]["all"]
                city_name = data["name"]
            except (KeyError, TypeError, ValueError) as e:
                # ValueError covers a body that is not valid JSON
                print(f"Through exception for city {city}: {e}")
            else:
                # save the data
                lats.append(lat)
                longs.append(lon)
                temps.append(temp)
                humid.append(humidity)
                windSpeed.append(speed)
                cloudiness.append(clouds)
                cities_found.append(city_name)
        elif response.status_code == 404:
            print(f"Missing data in API for {city}")
        else:
            print(response.status_code)
            print("The API is broken.")

    # sleep between requests
    time.sleep(1)

# make the dataframe in a single construction; column order matches the
# original column-by-column assignment
df = pd.DataFrame({
    "City": cities_found,
    "Latitude": lats,
    "Longitude": longs,
    "Temperature": temps,
    "Humidity": humid,
    "Wind Speed": windSpeed,
    "Cloudiness": cloudiness,
})

df.head(10)

Unnamed: 0,City,Latitude,Longitude,Temperature,Humidity,Wind Speed,Cloudiness
0,Carnarvon,-24.87,113.63,71.6,88,12.75,90
1,Vila Velha,-20.33,-40.29,76.77,83,9.17,75
2,Hithadhoo,-0.6,73.08,83.32,71,2.86,100
3,Pangnirtung,66.15,-65.71,7.07,73,7.16,100
4,Albany,42.6,-73.97,55.15,47,11.41,75


In [7]:
# Persist the collected weather table to disk; with pandas' default settings
# the row index is written as the first (unnamed) column.
df.to_csv(path_or_buf=output_data_file)