In [1]:
# Import modules
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import timeit
import requests
import time
from datetime import datetime
from citipy import citipy
from config import weather_api_key

In [2]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [3]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x23290660988>

In [4]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [5]:
# Create a list for holding the cities.
cities = []

# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count.
len(cities)

621

In [6]:
# Create an empty list to hold the weather data.
city_data = []

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

Beginning Data Retrieval     
-----------------------------


In [7]:
# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    
    # Add 1 to the record count.
    record_count += 1
    
    # Run an API request for each of the cities.
    try:
        
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | irbil
Processing Record 2 of Set 1 | souillac
Processing Record 3 of Set 1 | ahipara
Processing Record 4 of Set 1 | rikitea
Processing Record 5 of Set 1 | kilmez
City not found. Skipping...
Processing Record 6 of Set 1 | illoqqortoormiut
City not found. Skipping...
Processing Record 7 of Set 1 | mataura
Processing Record 8 of Set 1 | yulara
Processing Record 9 of Set 1 | chokurdakh
Processing Record 10 of Set 1 | tasiilaq
Processing Record 11 of Set 1 | punta arenas
Processing Record 12 of Set 1 | tonantins
Processing Record 13 of Set 1 | thompson
Processing Record 14 of Set 1 | auki
Processing Record 15 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 16 of Set 1 | kodiak
Processing Record 17 of Set 1 | bethel
Processing Record 18 of Set 1 | ushuaia
Processing Record 19 of Set 1 | basoko
Processing Record 20 of Set 1 | iqaluit
Processing Record 21 of Set 1 | albany
Processing Record 22 of Set 1 | hilo
Processing Record 23 of Set 1 | sas

Processing Record 37 of Set 4 | odweyne
Processing Record 38 of Set 4 | lerwick
Processing Record 39 of Set 4 | moron
Processing Record 40 of Set 4 | batagay-alyta
Processing Record 41 of Set 4 | chagda
City not found. Skipping...
Processing Record 42 of Set 4 | lincoln
Processing Record 43 of Set 4 | butaritari
Processing Record 44 of Set 4 | hermanus
Processing Record 45 of Set 4 | castro
Processing Record 46 of Set 4 | praia
Processing Record 47 of Set 4 | cockburn town
Processing Record 48 of Set 4 | santo angelo
Processing Record 49 of Set 4 | kutum
Processing Record 50 of Set 4 | ochamchira
Processing Record 1 of Set 5 | zvishavane
Processing Record 2 of Set 5 | kindu
Processing Record 3 of Set 5 | thayetmyo
Processing Record 4 of Set 5 | mogadishu
Processing Record 5 of Set 5 | samusu
City not found. Skipping...
Processing Record 6 of Set 5 | saint-philippe
Processing Record 7 of Set 5 | port hardy
Processing Record 8 of Set 5 | nasice
Processing Record 9 of Set 5 | broome
Proce

Processing Record 27 of Set 8 | trebinje
Processing Record 28 of Set 8 | duz
City not found. Skipping...
Processing Record 29 of Set 8 | teguise
Processing Record 30 of Set 8 | broken hill
Processing Record 31 of Set 8 | robertsport
Processing Record 32 of Set 8 | uralets
Processing Record 33 of Set 8 | rungata
City not found. Skipping...
Processing Record 34 of Set 8 | gat
Processing Record 35 of Set 8 | gornji vakuf
Processing Record 36 of Set 8 | mana
Processing Record 37 of Set 8 | khandyga
Processing Record 38 of Set 8 | san cristobal
Processing Record 39 of Set 8 | oranjemund
Processing Record 40 of Set 8 | anloga
Processing Record 41 of Set 8 | tilichiki
Processing Record 42 of Set 8 | kraslava
Processing Record 43 of Set 8 | la maddalena
Processing Record 44 of Set 8 | myitkyina
Processing Record 45 of Set 8 | coquimbo
Processing Record 46 of Set 8 | portland
Processing Record 47 of Set 8 | kousseri
Processing Record 48 of Set 8 | roald
Processing Record 49 of Set 8 | pyapon
Pr

Processing Record 15 of Set 12 | tres arroyos
Processing Record 16 of Set 12 | camopi
Processing Record 17 of Set 12 | youghal
Processing Record 18 of Set 12 | puerto escondido
Processing Record 19 of Set 12 | eagle pass
Processing Record 20 of Set 12 | alice springs
Processing Record 21 of Set 12 | janovice nad uhlavou
Processing Record 22 of Set 12 | agadir
Processing Record 23 of Set 12 | moose factory
Processing Record 24 of Set 12 | olafsvik
Processing Record 25 of Set 12 | binga
Processing Record 26 of Set 12 | arlit
Processing Record 27 of Set 12 | sakaiminato
Processing Record 28 of Set 12 | rongcheng
Processing Record 29 of Set 12 | dukat
Processing Record 30 of Set 12 | westport
Processing Record 31 of Set 12 | pozo colorado
Processing Record 32 of Set 12 | abu dhabi
Processing Record 33 of Set 12 | dolbeau
City not found. Skipping...
Processing Record 34 of Set 12 | lata
Processing Record 35 of Set 12 | veraval
Processing Record 36 of Set 12 | skjervoy
Processing Record 37 o

In [8]:
len(city_data)

572

In [9]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Irbil,36.1926,44.0106,85.82,19,0,3.44,IQ,2022-07-05 03:27:16
1,Souillac,-20.5167,57.5167,68.38,83,40,11.5,MU,2022-07-05 03:26:03
2,Ahipara,-35.1667,173.1667,58.8,96,100,13.35,NZ,2022-07-05 03:23:09
3,Rikitea,-23.1203,-134.9692,75.16,73,4,8.43,PF,2022-07-05 03:21:49
4,Mataura,-46.1927,168.8643,54.48,64,28,11.86,NZ,2022-07-05 03:21:53
5,Yulara,-25.2406,130.9889,55.96,28,0,11.1,AU,2022-07-05 03:27:17
6,Chokurdakh,70.6333,147.9167,71.83,54,100,12.19,RU,2022-07-05 03:22:07
7,Tasiilaq,65.6145,-37.6368,39.36,84,100,5.88,GL,2022-07-05 03:27:18
8,Punta Arenas,-53.15,-70.9167,26.71,93,0,5.75,CL,2022-07-05 03:18:20
9,Tonantins,-2.8731,-67.8022,72.01,99,100,1.1,BR,2022-07-05 03:27:18


In [11]:
# Reorder the columns
new_column_order = ['City', 'Country', 'Date', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed']
city_data_df = city_data_df[new_column_order]
city_data_df 

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Irbil,IQ,2022-07-05 03:27:16,36.1926,44.0106,85.82,19,0,3.44
1,Souillac,MU,2022-07-05 03:26:03,-20.5167,57.5167,68.38,83,40,11.50
2,Ahipara,NZ,2022-07-05 03:23:09,-35.1667,173.1667,58.80,96,100,13.35
3,Rikitea,PF,2022-07-05 03:21:49,-23.1203,-134.9692,75.16,73,4,8.43
4,Mataura,NZ,2022-07-05 03:21:53,-46.1927,168.8643,54.48,64,28,11.86
...,...,...,...,...,...,...,...,...,...
567,Goderich,CA,2022-07-05 03:42:53,43.7501,-81.7165,75.52,64,100,5.75
568,Maketu,NZ,2022-07-05 03:42:54,-37.7667,176.4500,56.75,91,100,13.33
569,Beverly,US,2022-07-05 03:42:54,42.5584,-70.8801,70.92,67,0,1.01
570,Kattivakkam,IN,2022-07-05 03:42:55,13.2167,80.3167,86.09,71,100,18.12


In [12]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")