In [1]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import requests

from citipy import citipy

# Import weather_api_key.
from config import weather_api_key

# Import the datetime module from the datetime library.
from datetime import datetime

In [2]:
# Create a set of random latitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1cf3b2b4f08>

In [3]:
# Add the latitude and longitudes to a list.
coordinates = list(lat_lngs)

In [4]:
# Create a list for holding the cities.
cities = []

# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates :
    city = citipy.nearest_city(coordinate[0],coordinate[1]).city_name
    
    # If city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
        
# Print the city count to confirm sufficient count.
len(cities)

623

In [5]:
# Bulding the basic url for the OpenWeatherMap
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&appid=" + weather_api_key

In [6]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval          ")
print("----------------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in our list.
for i, city in enumerate(cities):
    
    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count += 1
        
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")
    
    # Log the URL, record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        
        # Append the city information into the city_data list.
        city_data.append({"City": city.title() ,
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})
        
    # If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass
    
# Indicate that data loading is complete.
print("----------------------------------")
print("Data Retrieval Complete           ")
print("----------------------------------")

Beginning Data Retrieval          
----------------------------------
Processing Record 1 of Set 1 | xuddur
Processing Record 2 of Set 1 | thompson
Processing Record 3 of Set 1 | port shepstone
Processing Record 4 of Set 1 | nikolskoye
Processing Record 5 of Set 1 | lubango
Processing Record 6 of Set 1 | husavik
Processing Record 7 of Set 1 | mataura
Processing Record 8 of Set 1 | bosilovo
Processing Record 9 of Set 1 | torbay
Processing Record 10 of Set 1 | rikitea
Processing Record 11 of Set 1 | albany
Processing Record 12 of Set 1 | tura
Processing Record 13 of Set 1 | tumannyy
City not found. Skipping...
Processing Record 14 of Set 1 | mount isa
Processing Record 15 of Set 1 | chokurdakh
Processing Record 16 of Set 1 | igarka
Processing Record 17 of Set 1 | yellowknife
Processing Record 18 of Set 1 | vaini
Processing Record 19 of Set 1 | saleaula
City not found. Skipping...
Processing Record 20 of Set 1 | torrington
Processing Record 21 of Set 1 | taolanaro
City not found. Skipping

Processing Record 189 of Set 4 | hasaki
Processing Record 190 of Set 4 | ovalle
Processing Record 191 of Set 4 | chuy
Processing Record 192 of Set 4 | uren
Processing Record 193 of Set 4 | amderma
City not found. Skipping...
Processing Record 194 of Set 4 | ostrovnoy
Processing Record 195 of Set 4 | hofn
Processing Record 196 of Set 4 | nanning
Processing Record 197 of Set 4 | lafiagi
Processing Record 198 of Set 4 | sarkand
Processing Record 199 of Set 4 | cabo san lucas
Processing Record 200 of Set 4 | vila velha
Processing Record 201 of Set 4 | dum duma
Processing Record 202 of Set 4 | kutum
Processing Record 203 of Set 4 | jardim
Processing Record 205 of Set 5 | lagunas
Processing Record 206 of Set 5 | grand gaube
Processing Record 207 of Set 5 | pangkalanbuun
Processing Record 208 of Set 5 | bardiyah
Processing Record 209 of Set 5 | satitoa
City not found. Skipping...
Processing Record 210 of Set 5 | shubarshi
Processing Record 211 of Set 5 | puerto quijarro
Processing Record 212 

Processing Record 378 of Set 8 | aplahoue
Processing Record 379 of Set 8 | maun
Processing Record 380 of Set 8 | palauig
Processing Record 381 of Set 8 | ballina
Processing Record 382 of Set 8 | crestview
Processing Record 383 of Set 8 | sidi ali
Processing Record 384 of Set 8 | coulihaut
City not found. Skipping...
Processing Record 385 of Set 8 | petrolina
Processing Record 386 of Set 8 | pampa
Processing Record 387 of Set 8 | portland
Processing Record 388 of Set 8 | akom
Processing Record 389 of Set 8 | mahebourg
Processing Record 390 of Set 8 | verkhoyansk
Processing Record 391 of Set 8 | przhevalskoye
Processing Record 392 of Set 8 | santa ana
Processing Record 393 of Set 8 | tomatlan
Processing Record 394 of Set 8 | saint-augustin
Processing Record 395 of Set 8 | gat
Processing Record 396 of Set 8 | la serena
Processing Record 397 of Set 8 | umzimvubu
City not found. Skipping...
Processing Record 398 of Set 8 | tarudant
City not found. Skipping...
Processing Record 399 of Set 8 

Processing Record 563 of Set 12 | aranos
Processing Record 564 of Set 12 | tabou
Processing Record 565 of Set 12 | burica
City not found. Skipping...
Processing Record 566 of Set 12 | basco
Processing Record 567 of Set 12 | el alto
Processing Record 568 of Set 12 | alpena
Processing Record 569 of Set 12 | hovd
Processing Record 570 of Set 12 | iacu
Processing Record 571 of Set 12 | nizwa
Processing Record 572 of Set 12 | longonjo
Processing Record 573 of Set 12 | aswan
Processing Record 574 of Set 12 | kaka
Processing Record 575 of Set 12 | halalo
City not found. Skipping...
Processing Record 576 of Set 12 | krasnouralsk
Processing Record 577 of Set 12 | durban
Processing Record 578 of Set 12 | khasan
Processing Record 579 of Set 12 | ondorhaan
City not found. Skipping...
Processing Record 580 of Set 12 | chagda
City not found. Skipping...
Processing Record 581 of Set 12 | itanhem
Processing Record 582 of Set 12 | ratnagiri
Processing Record 583 of Set 12 | santo antonio do ica
Process

In [7]:
print(len(city_data))

566


In [8]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Xuddur,4.1213,43.8894,70.45,77,12,14.34,SO,2021-05-24 03:50:15
1,Thompson,55.7435,-97.8558,50.16,66,40,6.91,CA,2021-05-24 03:50:03
2,Port Shepstone,-30.7414,30.455,59.05,63,10,8.41,ZA,2021-05-24 03:53:47
3,Nikolskoye,59.7035,30.7861,50.4,95,100,11.5,RU,2021-05-24 03:50:52
4,Lubango,-14.9172,13.4925,54.55,51,51,4.5,AO,2021-05-24 03:53:48
5,Husavik,66.0449,-17.3389,40.91,87,100,6.82,IS,2021-05-24 03:51:32
6,Mataura,-46.1927,168.8643,49.48,68,68,2.64,NZ,2021-05-24 03:50:18
7,Bosilovo,41.4406,22.7278,63.82,66,75,4.7,MK,2021-05-24 03:53:48
8,Torbay,47.6666,-52.7314,37.76,97,90,18.41,CA,2021-05-24 03:50:34
9,Rikitea,-23.1203,-134.9692,74.77,75,46,5.06,PF,2021-05-24 03:50:19


In [9]:
# Reorder the columns
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
city_data_df = city_data_df[new_column_order]
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Xuddur,SO,2021-05-24 03:50:15,4.1213,43.8894,70.45,77,12,14.34
1,Thompson,CA,2021-05-24 03:50:03,55.7435,-97.8558,50.16,66,40,6.91
2,Port Shepstone,ZA,2021-05-24 03:53:47,-30.7414,30.455,59.05,63,10,8.41
3,Nikolskoye,RU,2021-05-24 03:50:52,59.7035,30.7861,50.4,95,100,11.5
4,Lubango,AO,2021-05-24 03:53:48,-14.9172,13.4925,54.55,51,51,4.5
5,Husavik,IS,2021-05-24 03:51:32,66.0449,-17.3389,40.91,87,100,6.82
6,Mataura,NZ,2021-05-24 03:50:18,-46.1927,168.8643,49.48,68,68,2.64
7,Bosilovo,MK,2021-05-24 03:53:48,41.4406,22.7278,63.82,66,75,4.7
8,Torbay,CA,2021-05-24 03:50:34,47.6666,-52.7314,37.76,97,90,18.41
9,Rikitea,PF,2021-05-24 03:50:19,-23.1203,-134.9692,74.77,75,46,5.06


In [10]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label='City_ID')