In [1]:
# Import the dependencies
import os
import time
from datetime import datetime

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy

from config import weather_api_key

In [2]:
# Draw uniformly distributed random latitudes and longitudes, then pair
# them up lazily; the zip object is shown as this cell's output.
sample_size = 1500
lats = np.random.uniform(-90.000, 90.000, sample_size)
lngs = np.random.uniform(-180.000, 180.000, sample_size)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7f8d7404cb40>

In [3]:
# Materialize the (latitude, longitude) pairs from the zip iterator into a list
coordinates = [*lat_lngs]

In [6]:
# Create a list for holding the unique cities, in first-seen order
cities = []

# Companion set so each duplicate check is a constant-time lookup
# instead of a scan over the whole list
seen_cities = set()

# Identify the nearest city for each latitude and longitude combination
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then we will add it to the cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm a sufficient count
print(len(cities))

589


In [7]:
# Starting URL for the OpenWeatherMap API call.
# HTTPS is used so the API key in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [8]:
# Create an empty list to hold the weather data
city_data = []

# Seconds to wait for a response before giving up on a city, so a single
# stalled connection cannot hang the whole retrieval loop
REQUEST_TIMEOUT_SECONDS = 10

# Print the beginning of the logging
print("Beginning Data Retrieval    ")
print("----------------------------")

# Create counters
record_count = 1
set_count = 1

# Loop through all the cities in our list
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes; the 60-second pause
    # between sets is presumably there to stay under the API rate limit
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Log the record and set numbers and the city
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
        # Pass the city through `params` so requests URL-encodes it
        # (spaces and any other reserved characters) and appends it to the
        # query string already present in `url`
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT_SECONDS)

        # Parse the JSON and retrieve data
        city_weather = response.json()

        # Parse the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        # Convert the UTC timestamp to a "YYYY-MM-DD HH:MM:SS" string
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')

        # Append the city information into city_data list
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # Skip the city on a network failure, an undecodable response, or a
    # payload missing the expected fields (e.g. an error response for an
    # unknown city). A bare `except:` is avoided so that KeyboardInterrupt
    # can still stop this long-running loop.
    except (requests.RequestException, KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete
print("-------------------------------")
print("Data Retrieval Complete        ")
print("-------------------------------")

Beginning Data Retrieval    
----------------------------
Processing Record 1 of Set 1 | mataura
Processing Record 2 of Set 1 | punta arenas
Processing Record 3 of Set 1 | biltine
Processing Record 4 of Set 1 | chuguyevka
Processing Record 5 of Set 1 | dikson
Processing Record 6 of Set 1 | kapaa
Processing Record 7 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 8 of Set 1 | arlit
Processing Record 9 of Set 1 | busselton
Processing Record 10 of Set 1 | pizarro
Processing Record 11 of Set 1 | georgetown
Processing Record 12 of Set 1 | hobyo
Processing Record 13 of Set 1 | emba
Processing Record 14 of Set 1 | russell
Processing Record 15 of Set 1 | upernavik
Processing Record 16 of Set 1 | kruisfontein
Processing Record 17 of Set 1 | den helder
Processing Record 18 of Set 1 | lavumisa
Processing Record 19 of Set 1 | jian
Processing Record 20 of Set 1 | wazzan
City not found. Skipping...
Processing Record 21 of Set 1 | tuatapere
Processing Record 22 of Set 1 | shingu
Pr

Processing Record 40 of Set 4 | belushya guba
City not found. Skipping...
Processing Record 41 of Set 4 | tasiilaq
Processing Record 42 of Set 4 | bhainsdehi
Processing Record 43 of Set 4 | komsomolskiy
Processing Record 44 of Set 4 | kirakira
Processing Record 45 of Set 4 | bowen
Processing Record 46 of Set 4 | watsa
Processing Record 47 of Set 4 | hlyboka
Processing Record 48 of Set 4 | vestmannaeyjar
Processing Record 49 of Set 4 | channel-port aux basques
Processing Record 50 of Set 4 | berlevag
Processing Record 1 of Set 5 | aguimes
Processing Record 2 of Set 5 | hofn
Processing Record 3 of Set 5 | asau
Processing Record 4 of Set 5 | touros
Processing Record 5 of Set 5 | kemijarvi
Processing Record 6 of Set 5 | soni
Processing Record 7 of Set 5 | darhan
Processing Record 8 of Set 5 | pochutla
Processing Record 9 of Set 5 | yangambi
Processing Record 10 of Set 5 | maykor
Processing Record 11 of Set 5 | kerema
Processing Record 12 of Set 5 | lagoa
Processing Record 13 of Set 5 | med

Processing Record 26 of Set 8 | saint-francois
Processing Record 27 of Set 8 | mehamn
Processing Record 28 of Set 8 | karkaralinsk
City not found. Skipping...
Processing Record 29 of Set 8 | lorengau
Processing Record 30 of Set 8 | lima
Processing Record 31 of Set 8 | tibati
Processing Record 32 of Set 8 | carbonia
Processing Record 33 of Set 8 | rio gallegos
Processing Record 34 of Set 8 | harper
Processing Record 35 of Set 8 | presidente olegario
Processing Record 36 of Set 8 | ubinskoye
Processing Record 37 of Set 8 | broken hill
Processing Record 38 of Set 8 | niamey
Processing Record 39 of Set 8 | dalvik
Processing Record 40 of Set 8 | siniscola
Processing Record 41 of Set 8 | louisbourg
City not found. Skipping...
Processing Record 42 of Set 8 | oxford
Processing Record 43 of Set 8 | hella
Processing Record 44 of Set 8 | svetlaya
Processing Record 45 of Set 8 | san rafael
Processing Record 46 of Set 8 | el oro
Processing Record 47 of Set 8 | henties bay
Processing Record 48 of Se

Processing Record 15 of Set 12 | banda aceh
Processing Record 16 of Set 12 | cozumel
Processing Record 17 of Set 12 | elmira
Processing Record 18 of Set 12 | hanumangarh
Processing Record 19 of Set 12 | logan
Processing Record 20 of Set 12 | pangody
Processing Record 21 of Set 12 | atar
Processing Record 22 of Set 12 | tianpeng
Processing Record 23 of Set 12 | port macquarie
Processing Record 24 of Set 12 | steamboat springs
Processing Record 25 of Set 12 | zhemchuzhnyy
City not found. Skipping...
Processing Record 26 of Set 12 | barra
Processing Record 27 of Set 12 | yerkoy
Processing Record 28 of Set 12 | kalmunai
Processing Record 29 of Set 12 | cleveland
Processing Record 30 of Set 12 | luderitz
Processing Record 31 of Set 12 | ilhabela
Processing Record 32 of Set 12 | homestead
Processing Record 33 of Set 12 | kyabram
Processing Record 34 of Set 12 | akdepe
Processing Record 35 of Set 12 | inuvik
Processing Record 36 of Set 12 | puri
Processing Record 37 of Set 12 | manthani
Proce

In [12]:
# Number of cities for which a weather record was appended to city_data
len(city_data)

541

In [13]:
# Build a DataFrame from the list of per-city dictionaries and preview
# the first ten rows
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Mataura,-46.1927,168.8643,47.48,81,94,5.86,NZ,2022-07-05 22:29:33
1,Punta Arenas,-53.15,-70.9167,21.31,100,0,6.91,CL,2022-07-05 22:29:34
2,Biltine,14.5333,20.9167,83.26,50,37,10.36,TD,2022-07-05 22:29:34
3,Chuguyevka,44.1653,133.8633,70.45,94,77,2.3,RU,2022-07-05 22:29:35
4,Dikson,73.5069,80.5464,34.7,98,95,10.51,RU,2022-07-05 22:29:35
5,Kapaa,22.0752,-159.319,87.78,75,100,16.11,US,2022-07-05 22:29:35
6,Arlit,18.7369,7.3853,91.15,31,91,13.42,NE,2022-07-05 22:29:36
7,Busselton,-33.65,115.3333,50.5,66,76,9.13,AU,2022-07-05 22:29:36
8,Pizarro,4.9533,-77.366,78.26,88,85,6.69,CO,2022-07-05 22:29:37
9,Georgetown,5.4112,100.3354,80.89,86,20,2.3,MY,2022-07-05 22:29:18


In [14]:
# Reorder the columns so the identifying fields (city, country, date) come first
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]

# Column selection returns a new DataFrame, so assign it back; otherwise
# city_data_df keeps its original column order for everything that follows
city_data_df = city_data_df[new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Mataura,NZ,2022-07-05 22:29:33,-46.1927,168.8643,47.48,81,94,5.86
1,Punta Arenas,CL,2022-07-05 22:29:34,-53.1500,-70.9167,21.31,100,0,6.91
2,Biltine,TD,2022-07-05 22:29:34,14.5333,20.9167,83.26,50,37,10.36
3,Chuguyevka,RU,2022-07-05 22:29:35,44.1653,133.8633,70.45,94,77,2.30
4,Dikson,RU,2022-07-05 22:29:35,73.5069,80.5464,34.70,98,95,10.51
...,...,...,...,...,...,...,...,...,...
536,Inuvik,CA,2022-07-05 22:43:58,68.3499,-133.7218,83.16,47,40,9.22
537,Puri,IN,2022-07-05 22:40:09,19.8000,85.8500,79.32,83,100,8.46
538,Manthani,IN,2022-07-05 22:43:59,18.6500,79.6667,78.06,88,94,4.88
539,Ende,ID,2022-07-05 22:43:59,-8.8432,121.6623,73.45,78,95,6.73


In [15]:
# Path of the output file (CSV)
output_data_file = "weather_data/cities.csv"

# Make sure the target directory exists; to_csv does not create missing
# directories and would otherwise raise an OSError
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)

# Export the city data into a CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")