In [1]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import os
from scipy.stats import linregress
import time
from datetime import datetime
from citipy import citipy
import requests

# Load the API key from config.py, which lives in the folder above this notebook.
# The working directory is switched to the parent only for the duration of the
# import and is always restored afterwards -- even if the import fails -- so a
# failed or repeated run of this cell cannot leave the kernel in the wrong folder.
_notebook_dir = os.getcwd()
os.chdir("..")
try:
    from config import weather_api_key
finally:
    # Return to wherever the notebook was started, regardless of the folder's name.
    os.chdir(_notebook_dir)

In [2]:
# Draw 2,000 random latitudes in [-90, 90) and 2,000 random longitudes in
# [-180, 180), then pair them up lazily. Latitudes are sampled first.
lats = np.random.uniform(-90.000, 90.000, 2000)
lngs = np.random.uniform(-180.000, 180.000, 2000)
lat_lngs = zip(lats, lngs)
# Keep the pairing as the cell's last expression so the notebook echoes it.
lat_lngs

<zip at 0x1d913023ec0>

In [3]:
# Pair each latitude with its longitude and materialise the pairs as a list.
# The source arrays are zipped here instead of draining the one-shot `lat_lngs`
# iterator, so re-running this cell gives the same list rather than an empty one.
coordinates = list(zip(lats, lngs))

In [4]:
# Identify the nearest city for each latitude/longitude pair and keep every
# city name once. dict.fromkeys removes repeats in a single pass while keeping
# first-seen order, so the list is not rescanned for every coordinate.
# NOTE(review): cities are de-duplicated by name only, so same-named cities in
# different countries collapse into one entry -- confirm that is intended.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name
        for lat, lng in coordinates
    )
)
# Print the city count to confirm sufficient count.
len(cities)

751

In [5]:
# Starting URL for the OpenWeatherMap current-weather API call (Imperial units).
# HTTPS is used so the API key in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [6]:
# Number of cities logged per set; a pause is taken after each full set.
CITIES_PER_SET = 50
# Seconds to sleep between sets (presumably to respect the API rate limit -- confirm).
SET_PAUSE_SECONDS = 60
# Seconds to wait for a single response before giving up on that city.
REQUEST_TIMEOUT_SECONDS = 10

# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets for logging purposes and pause between sets.
    if (i % CITIES_PER_SET == 0 and i >= CITIES_PER_SET):
        set_count += 1
        record_count = 1
        time.sleep(SET_PAUSE_SECONDS)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Let requests URL-encode the city name, and bound the wait so one
        # stalled connection cannot hang the whole retrieval.
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT_SECONDS)
        # Parse the JSON and retrieve data.
        city_weather = response.json()
        # Append the city information into city_data list. A missing field raises
        # before append() runs, so incomplete records are never stored.
        city_data.append({"City": city.title(),
                          "Country": city_weather["sys"]["country"],
                          "Lat": city_weather["coord"]["lat"],
                          "Lng": city_weather["coord"]["lon"],
                          "Max Temp": city_weather["main"]["temp_max"],
                          "Humidity": city_weather["main"]["humidity"],
                          "Cloudiness": city_weather["clouds"]["all"],
                          "Wind Speed": city_weather["wind"]["speed"],
                          "Current Description" : city_weather["weather"][0]["description"]})

    # Network-level failure (timeout, connection error, unreadable body): skip the city.
    except requests.exceptions.RequestException as request_error:
        # Only the error type is printed: the full message may include the
        # request URL, which carries the API key.
        print(f"Request failed ({type(request_error).__name__}). Skipping...")

    # The response lacked the expected fields (e.g. an error payload): skip the city.
    except (KeyError, IndexError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | flinders
Processing Record 2 of Set 1 | alofi
Processing Record 3 of Set 1 | san quintin
Processing Record 4 of Set 1 | narsaq
Processing Record 5 of Set 1 | ugoofaaru
Processing Record 6 of Set 1 | albany
Processing Record 7 of Set 1 | grindavik
Processing Record 8 of Set 1 | ushuaia
Processing Record 9 of Set 1 | atar
Processing Record 10 of Set 1 | acarau
Processing Record 11 of Set 1 | kapaa
Processing Record 12 of Set 1 | busselton
Processing Record 13 of Set 1 | lensk
Processing Record 14 of Set 1 | temaraia
City not found. Skipping...
Processing Record 15 of Set 1 | mar del plata
Processing Record 16 of Set 1 | puerto ayora
Processing Record 17 of Set 1 | dir
Processing Record 18 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 19 of Set 1 | barrow
Processing Record 20 of Set 1 | shimanovsk
Processing Record 21 of Set 1 | illoqqortoormiut
City not found. Skipping...
Proce

Processing Record 39 of Set 4 | calabozo
Processing Record 40 of Set 4 | chapais
Processing Record 41 of Set 4 | port elizabeth
Processing Record 42 of Set 4 | amderma
City not found. Skipping...
Processing Record 43 of Set 4 | jiuquan
Processing Record 44 of Set 4 | bilma
Processing Record 45 of Set 4 | hit
Processing Record 46 of Set 4 | kalmunai
Processing Record 47 of Set 4 | guerrero negro
Processing Record 48 of Set 4 | cap malheureux
Processing Record 49 of Set 4 | ippy
Processing Record 50 of Set 4 | kodiak
Processing Record 1 of Set 5 | yuncheng
Processing Record 2 of Set 5 | wagar
Processing Record 3 of Set 5 | san pedro
Processing Record 4 of Set 5 | clermont
Processing Record 5 of Set 5 | djambala
Processing Record 6 of Set 5 | faya
Processing Record 7 of Set 5 | camacha
Processing Record 8 of Set 5 | la rioja
Processing Record 9 of Set 5 | bonavista
Processing Record 10 of Set 5 | biak
Processing Record 11 of Set 5 | tessalit
Processing Record 12 of Set 5 | khakhea
Process

Processing Record 26 of Set 8 | moroni
Processing Record 27 of Set 8 | honiara
Processing Record 28 of Set 8 | port blair
Processing Record 29 of Set 8 | itoman
Processing Record 30 of Set 8 | massa marittima
Processing Record 31 of Set 8 | vallenar
Processing Record 32 of Set 8 | naze
Processing Record 33 of Set 8 | mehran
Processing Record 34 of Set 8 | ilebo
Processing Record 35 of Set 8 | marakkanam
Processing Record 36 of Set 8 | bulawayo
Processing Record 37 of Set 8 | sulangan
Processing Record 38 of Set 8 | onega
Processing Record 39 of Set 8 | komsomolskiy
Processing Record 40 of Set 8 | moron
Processing Record 41 of Set 8 | araguaina
Processing Record 42 of Set 8 | ipixuna
Processing Record 43 of Set 8 | sedelnikovo
City not found. Skipping...
Processing Record 44 of Set 8 | kutum
Processing Record 45 of Set 8 | can tho
Processing Record 46 of Set 8 | roberto payan
City not found. Skipping...
Processing Record 47 of Set 8 | palabuhanratu
City not found. Skipping...
Processing

Processing Record 13 of Set 12 | alyangula
Processing Record 14 of Set 12 | kjollefjord
Processing Record 15 of Set 12 | sentyabrskiy
City not found. Skipping...
Processing Record 16 of Set 12 | biloela
Processing Record 17 of Set 12 | santa clara
Processing Record 18 of Set 12 | attawapiskat
City not found. Skipping...
Processing Record 19 of Set 12 | husavik
Processing Record 20 of Set 12 | erdemli
Processing Record 21 of Set 12 | butembo
Processing Record 22 of Set 12 | olinda
Processing Record 23 of Set 12 | dali
Processing Record 24 of Set 12 | teya
Processing Record 25 of Set 12 | perth
Processing Record 26 of Set 12 | westfield
Processing Record 27 of Set 12 | mandalgovi
Processing Record 28 of Set 12 | jijiga
Processing Record 29 of Set 12 | prince george
Processing Record 30 of Set 12 | mwinilunga
Processing Record 31 of Set 12 | molina
Processing Record 32 of Set 12 | havoysund
Processing Record 33 of Set 12 | verkhoyansk
Processing Record 34 of Set 12 | kashan
Processing Rec

Processing Record 49 of Set 15 | linhares
Processing Record 50 of Set 15 | padre paraiso
Processing Record 1 of Set 16 | vohibinany
-----------------------------
Data Retrieval Complete      
-----------------------------


In [7]:
# Build a DataFrame from the collected list of per-city dictionaries.
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.head(n=10)

Unnamed: 0,City,Country,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description
0,Flinders,AU,-34.5833,150.8552,65.37,91,73,4.0,broken clouds
1,Alofi,NU,-19.0595,-169.9187,80.49,89,91,3.44,overcast clouds
2,San Quintin,MX,30.4833,-115.95,80.2,25,72,8.3,broken clouds
3,Narsaq,GL,60.9167,-46.05,37.62,70,39,5.03,scattered clouds
4,Ugoofaaru,MV,5.6667,73.0,84.54,66,28,5.23,scattered clouds
5,Albany,US,42.6001,-73.9662,56.05,61,65,1.99,broken clouds
6,Grindavik,IS,63.8424,-22.4338,37.35,48,0,4.61,clear sky
7,Ushuaia,AR,-54.8,-68.3,46.02,65,0,3.44,clear sky
8,Atar,MR,20.5169,-13.0499,86.92,10,0,10.56,clear sky
9,Acarau,BR,-2.8856,-40.12,82.09,80,32,13.15,scattered clouds


In [8]:
# Name of the output CSV, written relative to the current working directory.
output_data_file = "Weather_Database.csv"
# Export the city data to CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")