In [1]:
# Import dependencies.
# Standard library
import os
# Import the datetime class and the UTC timezone from the datetime module.
from datetime import datetime, timezone

# Third-party libraries
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
# Import the requests library
import requests
from citipy import citipy

# Import the API key
from config import weather_api_key

In [2]:
# Draw 1,500 random coordinates: latitudes from [-90, 90) and longitudes
# from [-180, 180). Latitudes are drawn first, then longitudes.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
# Pair each latitude with the longitude at the same position.
lat_lngs = [(lat, lng) for lat, lng in zip(lats, lngs)]
lat_lngs

[(24.605145709410934, 33.16998041287832),
 (-53.77897774773471, 75.12808187689319),
 (-54.42703620165992, 37.605485447420506),
 (-42.341997166914226, 135.40062065584368),
 (-55.095893984420336, 132.67357741788828),
 (-28.11686127170566, -109.9819361224097),
 (53.94725557869711, 110.38147604379475),
 (-60.32685870596936, -11.546663451625705),
 (-31.663347945666914, -15.089510128550444),
 (-35.09515265627526, 153.4459437116392),
 (-16.986864274319714, -13.456152764623766),
 (78.85283197204234, -104.90550160403671),
 (-50.011554968005484, 75.9132684820766),
 (79.51413542184912, -146.8305084252397),
 (44.68961217299071, -87.69904079355437),
 (63.40219961332102, -118.85935621690783),
 (10.615908111691056, -101.05694365747065),
 (-33.70446893013254, -156.4523275694427),
 (49.2806877588728, 61.49030939816933),
 (1.819269816808685, -91.51396293848012),
 (16.390845137239495, -68.84927360345993),
 (-56.411332848417146, 90.32281136515081),
 (-16.324286757445833, 38.553835907553974),
 (-44.7425488

In [3]:
# Look up the nearest city for every coordinate pair and keep each city name
# once. dict.fromkeys discards repeated names while keeping them in the order
# they were first seen, so the list matches an "append if not already present"
# loop over lat_lngs.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in lat_lngs
))
# Print the city count to confirm sufficient count.
len(cities)

621

In [4]:
# Steps for retrieving the weather data:
# - Import our dependencies, then initialize the counters and an empty list that will hold the weather data.
# - Loop through the cities list.
# - Group the cities in sets of 50 to log the progress as we find the weather data for each city.
#     - Two counters will be needed here: one to log the city count from 1 to 50, and another for the sets.
# - Build the city_url, or endpoint, for each city.
# - Log the URL and the record and set numbers.
# - Make an API request for each city.
# - Parse the JSON weather data for the following:
#     - City, country, and date
#     - Latitude and longitude
#     - Maximum temperature
#     - Humidity
#     - Cloudiness
#     - Wind speed
# - Add the data to a list in dictionary format, and then convert the list to a DataFrame.

In [6]:
# Retrieve the current weather for every city in `cities` and collect one
# dictionary per successfully parsed city in `city_data`. Cities whose request
# fails or whose response lacks the expected fields are logged and skipped.

# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters: record_count restarts at 1 for each set of 50 cities,
# set_count numbers the sets.
record_count = 1
set_count = 1

# Starting URL for Weather Map API Call. HTTPS is used because the API key
# travels in the query string and would otherwise be sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Log the record and set numbers and the city. The request URL is not
    # logged because it contains the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Passing the city through `params` lets requests URL-encode the name.
        # The timeout keeps one stalled connection from hanging the whole loop.
        response = requests.get(url, params={"q": city}, timeout=10)
        # Parse the JSON and retrieve data.
        city_weather = response.json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard (UTC). fromtimestamp with an
        # explicit UTC timezone replaces the deprecated utcfromtimestamp and
        # formats to the same string.
        city_date = datetime.fromtimestamp(city_weather["dt"], tz=timezone.utc).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If the response has no weather fields (KeyError) or is not valid JSON
    # (ValueError), skip the city.
    except (KeyError, ValueError):
        print("City not found. Skipping...")
    # Network-level failures (connection errors, timeouts) also skip the city.
    # Only the exception class name is printed: the full message can contain
    # the request URL and, with it, the API key.
    except requests.exceptions.RequestException as exc:
        print(f"Request failed ({type(exc).__name__}). Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | aswan
Processing Record 2 of Set 1 | souillac
Processing Record 3 of Set 1 | port alfred
Processing Record 4 of Set 1 | mount gambier
Processing Record 5 of Set 1 | new norfolk
Processing Record 6 of Set 1 | rikitea
Processing Record 7 of Set 1 | kurumkan
Processing Record 8 of Set 1 | cape town
Processing Record 9 of Set 1 | jamestown
Processing Record 10 of Set 1 | sydney
Processing Record 11 of Set 1 | yellowknife
Processing Record 12 of Set 1 | mahebourg
Processing Record 13 of Set 1 | barrow
Processing Record 14 of Set 1 | bellevue
Processing Record 15 of Set 1 | hay river
Processing Record 16 of Set 1 | tecoanapa
Processing Record 17 of Set 1 | avera
Processing Record 18 of Set 1 | svetlyy
City not found. Skipping...
Processing Record 19 of Set 1 | puerto ayora
Processing Record 20 of Set 1 | la romana
Processing Record 21 of Set 1 | busselton
Processing Record 22 of Set 1 | mocuba
Processi

Processing Record 39 of Set 4 | vicuna
City not found. Skipping...
Processing Record 40 of Set 4 | castro
Processing Record 41 of Set 4 | havre-saint-pierre
Processing Record 42 of Set 4 | nikolskoye
Processing Record 43 of Set 4 | gawler
Processing Record 44 of Set 4 | berlevag
Processing Record 45 of Set 4 | alyangula
Processing Record 46 of Set 4 | camacha
Processing Record 47 of Set 4 | yerbogachen
Processing Record 48 of Set 4 | mizdah
Processing Record 49 of Set 4 | blagoyevo
Processing Record 50 of Set 4 | the pas
Processing Record 1 of Set 5 | yei
City not found. Skipping...
Processing Record 2 of Set 5 | antropovo
Processing Record 3 of Set 5 | paamiut
Processing Record 4 of Set 5 | emerald
Processing Record 5 of Set 5 | bay saint louis
Processing Record 6 of Set 5 | hithadhoo
Processing Record 7 of Set 5 | sao jose da coroa grande
Processing Record 8 of Set 5 | kieta
Processing Record 9 of Set 5 | surt
Processing Record 10 of Set 5 | constitucion
Processing Record 11 of Set 5

Processing Record 21 of Set 8 | korla
City not found. Skipping...
Processing Record 22 of Set 8 | pangnirtung
Processing Record 23 of Set 8 | dolbeau
City not found. Skipping...
Processing Record 24 of Set 8 | ballina
Processing Record 25 of Set 8 | sola
Processing Record 26 of Set 8 | sept-iles
Processing Record 27 of Set 8 | saraland
Processing Record 28 of Set 8 | burns lake
Processing Record 29 of Set 8 | soloneshnoye
Processing Record 30 of Set 8 | phalaborwa
Processing Record 31 of Set 8 | porterville
Processing Record 32 of Set 8 | klaksvik
Processing Record 33 of Set 8 | dicabisagan
Processing Record 34 of Set 8 | mahibadhoo
Processing Record 35 of Set 8 | nacozari
Processing Record 36 of Set 8 | castlemaine
Processing Record 37 of Set 8 | kalomo
City not found. Skipping...
Processing Record 38 of Set 8 | cumaribo
City not found. Skipping...
Processing Record 39 of Set 8 | inirida
Processing Record 40 of Set 8 | cockburn town
Processing Record 41 of Set 8 | mananara
City not fo

Processing Record 5 of Set 12 | luganville
Processing Record 6 of Set 12 | praia
Processing Record 7 of Set 12 | barmer
Processing Record 8 of Set 12 | balkanabat
Processing Record 9 of Set 12 | isangel
Processing Record 10 of Set 12 | loanda
Processing Record 11 of Set 12 | quelimane
Processing Record 12 of Set 12 | tortoli
Processing Record 13 of Set 12 | ampanihy
Processing Record 14 of Set 12 | kuche
City not found. Skipping...
Processing Record 15 of Set 12 | bayji
Processing Record 16 of Set 12 | tandalti
Processing Record 17 of Set 12 | kolyvan
Processing Record 18 of Set 12 | ilhabela
Processing Record 19 of Set 12 | te anau
Processing Record 20 of Set 12 | saleaula
City not found. Skipping...
Processing Record 21 of Set 12 | billings
Processing Record 22 of Set 12 | oga
Processing Record 23 of Set 12 | uspenka
Processing Record 24 of Set 12 | geraldton
Processing Record 25 of Set 12 | san cristobal
Processing Record 26 of Set 12 | santa quiteria
Processing Record 27 of Set 12 

In [7]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Aswan,24.09,32.9,71.6,26,55,5.82,EG,2019-11-05 07:25:00
1,Souillac,45.6,-0.6,50.0,93,98,12.75,FR,2019-11-05 07:25:00
2,Port Alfred,-33.59,26.89,71.01,80,22,8.01,ZA,2019-11-05 07:25:00
3,Mount Gambier,-37.83,140.78,59.0,67,90,19.46,AU,2019-11-05 07:25:00
4,New Norfolk,-42.78,147.06,60.01,41,75,18.34,AU,2019-11-05 07:25:00
5,Rikitea,-23.12,-134.97,75.76,89,100,4.9,PF,2019-11-05 07:25:01
6,Kurumkan,54.33,110.32,14.32,78,89,2.17,RU,2019-11-05 07:25:01
7,Cape Town,-33.93,18.42,78.01,38,100,10.29,ZA,2019-11-05 07:25:01
8,Jamestown,-33.21,138.6,70.99,22,18,14.25,AU,2019-11-05 07:22:42
9,Sydney,-33.85,151.22,66.2,59,20,16.11,AU,2019-11-05 07:22:15


In [9]:
# Column order for the reordered frame: city, country and date first, then
# the coordinates, then the weather measurements.
newColumnOrder = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
# Select all rows with the columns in the new order; city_data_df itself is
# not reassigned.
city_data_Update_df = city_data_df.loc[:, newColumnOrder]
city_data_Update_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Aswan,EG,2019-11-05 07:25:00,24.09,32.90,71.60,26,55,5.82
1,Souillac,FR,2019-11-05 07:25:00,45.60,-0.60,50.00,93,98,12.75
2,Port Alfred,ZA,2019-11-05 07:25:00,-33.59,26.89,71.01,80,22,8.01
3,Mount Gambier,AU,2019-11-05 07:25:00,-37.83,140.78,59.00,67,90,19.46
4,New Norfolk,AU,2019-11-05 07:25:00,-42.78,147.06,60.01,41,75,18.34
...,...,...,...,...,...,...,...,...,...
552,Mildura,AU,2019-11-05 07:27:01,-34.18,142.16,73.40,23,38,10.29
553,Gravdal,NO,2019-11-05 07:27:01,59.79,5.78,39.20,55,54,6.93
554,Kirovsk,RU,2019-11-05 07:27:01,67.62,33.66,10.96,94,69,8.08
555,Santa Isabel,MX,2019-11-05 07:27:01,32.63,-115.58,60.80,17,1,5.82


In [10]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the target folder exists: to_csv does not create missing
# directories, so a fresh checkout would otherwise fail here.
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)
# Export the reordered frame (city_data_Update_df) into a CSV so the file
# carries the City/Country/Date-first column order; the index is written
# under the "City_ID" label.
city_data_Update_df.to_csv(output_data_file, index_label="City_ID")