In [1]:
#Import standard-library modules
import os
from datetime import datetime, timezone

#Import third-party dependencies
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy

#Import the API key.
from config import weather_api_key

In [2]:
#Draw 1500 random latitudes and 1500 random longitudes, then pair them up lazily with zip
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x20ab4f35840>

In [3]:
#Create a list of (latitude, longitude) pairs.
#The pairs are zipped from the lats and lngs arrays directly instead of draining the one-shot
#lat_lngs iterator, so re-running this cell rebuilds the same list rather than an empty one.
coordinates = list(zip(lats, lngs))

In [4]:
#Identify the nearest city for each latitude and longitude combination and keep each name once.
#dict.fromkeys keeps only the first occurrence of every name, in encounter order, and uses hashed
#lookups instead of rescanning a growing list for each coordinate.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))
#Check the list count to confirm >500 unique cities generated
len(cities)

606

In [5]:
#Starting URL for Weather Map API call (HTTPS, so the API key is not sent in clear text)
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

#Number of cities per logging set, and seconds to wait for each API response
set_size = 50
request_timeout = 10

#Create an empty list to hold weather data
city_data = []

#Print a message at the beginning of logging
print("Beginning Data Retrieval\n-------------------------")

#Loop through all the cities in cities[]
for i, city in enumerate(cities):

    #Records are numbered continuously across the whole run; a new set starts every set_size cities
    record_count = i + 1
    set_count = i // set_size + 1

    #Log the record, set numbers and the city (never the URL, because it contains the API key)
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    #Run API requests for each of the cities
    try:
        #Let requests encode the city name into the query string (spaces and special characters),
        #and use a timeout so one stalled connection cannot hang the whole run
        city_weather = requests.get(url, params={"q": city}, timeout=request_timeout).json()

        #Parse out the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        #Convert the Unix timestamp to a UTC date string (utcfromtimestamp is deprecated)
        city_date = datetime.fromtimestamp(city_weather["dt"], tz=timezone.utc).strftime('%Y-%m-%d %H:%M:%S')

        #Append the city information to the city_data list
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    #Network-level failure (connection error, timeout, ...): skip the city and keep going.
    #Only the exception type is printed because the exception text can include the URL and its API key.
    except requests.exceptions.RequestException as err:
        print(f"Request for {city} failed ({type(err).__name__}). Skipping...")

    #The response lacked the expected fields or was not valid JSON - presumably the API did not
    #recognise the city name. Skip the city and keep going; Ctrl-C and genuine bugs still surface.
    except (KeyError, ValueError):
        print(f"City name {city} not found. Skipping...")

# Indicate that Data Loading is complete.
print("------------------------\nData Retrieval Complete\n------------------------")

Beginning Data Retrieval
-------------------------
Processing Record 1 of Set 1 | saldanha
Processing Record 2 of Set 1 | taolanaro
City name taolanaro not found. Skipping...
Processing Record 3 of Set 1 | dingle
Processing Record 4 of Set 1 | vaini
Processing Record 5 of Set 1 | illoqqortoormiut
City name illoqqortoormiut not found. Skipping...
Processing Record 6 of Set 1 | ilebo
Processing Record 7 of Set 1 | marawi
Processing Record 8 of Set 1 | cape town
Processing Record 9 of Set 1 | albany
Processing Record 10 of Set 1 | filadelfia
Processing Record 11 of Set 1 | chuy
Processing Record 12 of Set 1 | rikitea
Processing Record 13 of Set 1 | hilo
Processing Record 14 of Set 1 | medvedka
Processing Record 15 of Set 1 | gimbi
Processing Record 16 of Set 1 | caravelas
Processing Record 17 of Set 1 | alexandria
Processing Record 18 of Set 1 | sitka
Processing Record 19 of Set 1 | corn island
Processing Record 20 of Set 1 | tabiauea
City name tabiauea not found. Skipping...
Processing R

Processing Record 178 of Set 4 | lorengau
Processing Record 179 of Set 4 | ponta do sol
Processing Record 180 of Set 4 | teya
Processing Record 181 of Set 4 | kaoma
Processing Record 182 of Set 4 | noumea
Processing Record 183 of Set 4 | novoagansk
Processing Record 184 of Set 4 | barrow
Processing Record 185 of Set 4 | dobryanka
Processing Record 186 of Set 4 | najran
Processing Record 187 of Set 4 | tecoanapa
Processing Record 188 of Set 4 | camacha
Processing Record 189 of Set 4 | ostrovnoy
Processing Record 190 of Set 4 | carnarvon
Processing Record 191 of Set 4 | narowal
Processing Record 192 of Set 4 | saint anthony
Processing Record 193 of Set 4 | shenkursk
Processing Record 194 of Set 4 | stromness
Processing Record 195 of Set 4 | okhotsk
Processing Record 196 of Set 4 | oliveira do hospital
Processing Record 197 of Set 4 | kodiak
Processing Record 198 of Set 4 | belushya guba
City name belushya guba not found. Skipping...
Processing Record 199 of Set 4 | sao joao da barra
Proc

Processing Record 357 of Set 8 | hihifo
City name hihifo not found. Skipping...
Processing Record 358 of Set 8 | andenes
Processing Record 359 of Set 8 | aporawan
City name aporawan not found. Skipping...
Processing Record 360 of Set 8 | lagos
Processing Record 361 of Set 8 | puerto carreno
Processing Record 362 of Set 8 | bakloh
Processing Record 363 of Set 8 | corbelia
Processing Record 364 of Set 8 | svetlaya
Processing Record 365 of Set 8 | iranshahr
Processing Record 366 of Set 8 | ciras
City name ciras not found. Skipping...
Processing Record 367 of Set 8 | andradas
Processing Record 368 of Set 8 | yei
Processing Record 369 of Set 8 | maragogi
Processing Record 370 of Set 8 | beruni
City name beruni not found. Skipping...
Processing Record 371 of Set 8 | havre
Processing Record 372 of Set 8 | asau
Processing Record 373 of Set 8 | altay
Processing Record 374 of Set 8 | rocha
Processing Record 375 of Set 8 | salalah
Processing Record 376 of Set 8 | nioro
Processing Record 377 of Se

Processing Record 538 of Set 11 | daugavpils
Processing Record 539 of Set 11 | bondoukou
Processing Record 540 of Set 11 | wulanhaote
City name wulanhaote not found. Skipping...
Processing Record 541 of Set 11 | acapulco
Processing Record 542 of Set 11 | namibe
Processing Record 543 of Set 11 | podgornoye
Processing Record 544 of Set 11 | storm lake
Processing Record 545 of Set 11 | aksarka
Processing Record 546 of Set 11 | bulgan
Processing Record 547 of Set 11 | magistralnyy
Processing Record 548 of Set 11 | fuling
Processing Record 549 of Set 11 | ongandjera
Processing Record 550 of Set 11 | khatanga
Processing Record 551 of Set 12 | hirara
Processing Record 552 of Set 12 | tessalit
Processing Record 553 of Set 12 | karkaralinsk
City name karkaralinsk not found. Skipping...
Processing Record 554 of Set 12 | malatya
Processing Record 555 of Set 12 | jinji
Processing Record 556 of Set 12 | tapaua
City name tapaua not found. Skipping...
Processing Record 557 of Set 12 | carutapera
Proc

In [6]:
#Verify we have at least 500 cities with data
#(city_data only contains the cities whose API response was parsed successfully)
len(city_data)

555

In [7]:
#Build a DataFrame from the list of per-city records and preview its first ten rows
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Saldanha,-33.0117,17.9442,57.18,83,7,0.83,ZA,2021-05-26 01:23:51
1,Dingle,10.9995,122.6711,83.55,77,100,3.42,PH,2021-05-26 01:23:52
2,Vaini,-21.2,-175.2,73.56,88,90,9.22,TO,2021-05-26 01:23:52
3,Ilebo,-4.3167,20.5833,68.58,69,45,1.95,CD,2021-05-26 01:23:52
4,Marawi,7.9986,124.2928,74.64,68,82,3.65,PH,2021-05-26 01:23:53
5,Cape Town,-33.9258,18.4232,60.89,78,75,4.0,ZA,2021-05-26 01:19:03
6,Albany,42.6001,-73.9662,74.05,66,100,5.06,US,2021-05-26 01:23:53
7,Filadelfia,39.9523,-75.1638,71.13,73,40,4.0,US,2021-05-26 01:23:54
8,Chuy,-33.6971,-53.4616,49.06,83,0,6.44,UY,2021-05-26 01:23:54
9,Rikitea,-23.1203,-134.9692,77.59,77,35,16.04,PF,2021-05-26 01:23:54


In [9]:
#Put the identifying columns (city, country, date) first, then the coordinates and the measurements
new_col_order = ["City", "Country", "Date",
                 "Lat", "Lng",
                 "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
city_data_df = city_data_df.loc[:, new_col_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Saldanha,ZA,2021-05-26 01:23:51,-33.0117,17.9442,57.18,83,7,0.83
1,Dingle,PH,2021-05-26 01:23:52,10.9995,122.6711,83.55,77,100,3.42
2,Vaini,TO,2021-05-26 01:23:52,-21.2000,-175.2000,73.56,88,90,9.22
3,Ilebo,CD,2021-05-26 01:23:52,-4.3167,20.5833,68.58,69,45,1.95
4,Marawi,PH,2021-05-26 01:23:53,7.9986,124.2928,74.64,68,82,3.65
...,...,...,...,...,...,...,...,...,...
550,Luau,AO,2021-05-26 01:27:15,-10.7073,22.2247,54.39,58,66,4.21
551,Makakilo City,US,2021-05-26 01:27:15,21.3469,-158.0858,81.68,65,75,10.36
552,Kang,BW,2021-05-26 01:27:15,-23.6752,22.7876,53.40,44,98,6.29
553,Nizhniy Chir,RU,2021-05-26 01:27:16,48.3597,43.0865,55.31,83,17,7.85


In [10]:
#Create the output file (CSV)
output_data_file = "weather_data/cities.csv"

#Make sure the target folder exists first: to_csv does not create missing directories, and a
#failure here would come only after the long API retrieval run has finished
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)

#Export city_data into a CSV file, labelling the index column City_ID
city_data_df.to_csv(output_data_file, index_label="City_ID")