In [1]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy

# Import the datetime module from the datetime library.
from datetime import datetime

# Import the API key.
from config import weather_api_key

# Import requests
import requests

In [2]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fb01f8256e0>

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [4]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

612

In [5]:
cities

['yellowknife',
 'rocha',
 'marzuq',
 'port alfred',
 'tebingtinggi',
 'hobart',
 'beringovskiy',
 'atuona',
 'buraydah',
 'ushuaia',
 'punta arenas',
 'hasaki',
 'mar del plata',
 'bambous virieux',
 'banbury',
 'luena',
 'tuktoyaktuk',
 'yar-sale',
 'jamestown',
 'hermanus',
 'talnakh',
 'alyangula',
 'ca mau',
 'albany',
 'norman wells',
 'bluff',
 'port macquarie',
 'souillac',
 'salta',
 'vaitupu',
 'mataura',
 'ambatolampy',
 'chuy',
 'saleaula',
 'harindanga',
 'zhitikara',
 'yumen',
 'pasighat',
 'rikitea',
 'vila franca do campo',
 'vaini',
 'bijar',
 'potosi',
 'kodiak',
 'dinajpur',
 'ngukurr',
 'constitucion',
 'butaritari',
 'shieli',
 'taolanaro',
 'kapaa',
 'arraial do cabo',
 'avarua',
 'toora-khem',
 'mys shmidta',
 'la ronge',
 'upernavik',
 'ribeira grande',
 'semirom',
 'isangel',
 'adrar',
 'muroto',
 'aklavik',
 'itupiranga',
 'illoqqortoormiut',
 'bilma',
 'nome',
 'port elizabeth',
 'abha',
 'houma',
 'brae',
 'busselton',
 'maldonado',
 'samusu',
 'dalvik',
 'n

In [6]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=faf0b3a56ae8e1d08d219ca62c9931f9


In [7]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
    
# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping..." + city + str(i))
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | yellowknife
Processing Record 2 of Set 1 | rocha
Processing Record 3 of Set 1 | marzuq
Processing Record 4 of Set 1 | port alfred
Processing Record 5 of Set 1 | tebingtinggi
Processing Record 6 of Set 1 | hobart
Processing Record 7 of Set 1 | beringovskiy
Processing Record 8 of Set 1 | atuona
Processing Record 9 of Set 1 | buraydah
Processing Record 10 of Set 1 | ushuaia
Processing Record 11 of Set 1 | punta arenas
Processing Record 12 of Set 1 | hasaki
Processing Record 13 of Set 1 | mar del plata
Processing Record 14 of Set 1 | bambous virieux
Processing Record 15 of Set 1 | banbury
Processing Record 16 of Set 1 | luena
Processing Record 17 of Set 1 | tuktoyaktuk
Processing Record 18 of Set 1 | yar-sale
Processing Record 19 of Set 1 | jamestown
Processing Record 20 of Set 1 | hermanus
Processing Record 21 of Set 1 | talnakh
Processing Record 22 of Set 1 | alyangula
Processing Record 23 of Set 1

Processing Record 32 of Set 4 | faanui
Processing Record 33 of Set 4 | narsaq
Processing Record 34 of Set 4 | longyearbyen
Processing Record 35 of Set 4 | sept-iles
Processing Record 36 of Set 4 | carnarvon
Processing Record 37 of Set 4 | port-gentil
Processing Record 38 of Set 4 | ayolas
Processing Record 39 of Set 4 | aguimes
Processing Record 40 of Set 4 | margate
Processing Record 41 of Set 4 | rungata
City not found. Skipping...rungata190
Processing Record 42 of Set 4 | big spring
Processing Record 43 of Set 4 | marshalltown
Processing Record 44 of Set 4 | xining
Processing Record 45 of Set 4 | mitsamiouli
Processing Record 46 of Set 4 | bull savanna
Processing Record 47 of Set 4 | tiksi
Processing Record 48 of Set 4 | beloha
Processing Record 49 of Set 4 | kindu
Processing Record 50 of Set 4 | jalu
Processing Record 1 of Set 5 | dolores hidalgo
Processing Record 2 of Set 5 | oyama
Processing Record 3 of Set 5 | sanandaj
Processing Record 4 of Set 5 | kirakira
Processing Record 5 

Processing Record 17 of Set 8 | ocampo
Processing Record 18 of Set 8 | mahebourg
Processing Record 19 of Set 8 | ndago
Processing Record 20 of Set 8 | launceston
Processing Record 21 of Set 8 | collingwood
Processing Record 22 of Set 8 | lata
Processing Record 23 of Set 8 | krasnoyarsk-45
City not found. Skipping...krasnoyarsk-45372
Processing Record 24 of Set 8 | lorengau
Processing Record 25 of Set 8 | burkhala
City not found. Skipping...burkhala374
Processing Record 26 of Set 8 | meadow lake
Processing Record 27 of Set 8 | hovd
Processing Record 28 of Set 8 | davila
Processing Record 29 of Set 8 | faya
Processing Record 30 of Set 8 | tumannyy
City not found. Skipping...tumannyy379
Processing Record 31 of Set 8 | yulara
Processing Record 32 of Set 8 | amderma
City not found. Skipping...amderma381
Processing Record 33 of Set 8 | saquisili
Processing Record 34 of Set 8 | haines junction
Processing Record 35 of Set 8 | hulan
Processing Record 36 of Set 8 | kamenka
Processing Record 37 o

Processing Record 4 of Set 12 | sioux lookout
Processing Record 5 of Set 12 | padang
Processing Record 6 of Set 12 | riberalta
Processing Record 7 of Set 12 | sao joao da barra
Processing Record 8 of Set 12 | merrill
Processing Record 9 of Set 12 | impfondo
Processing Record 10 of Set 12 | evanton
Processing Record 11 of Set 12 | yazoo city
Processing Record 12 of Set 12 | tiznit
Processing Record 13 of Set 12 | bereda
Processing Record 14 of Set 12 | corpus christi
Processing Record 15 of Set 12 | shubarshi
Processing Record 16 of Set 12 | alice springs
Processing Record 17 of Set 12 | kawambwa
Processing Record 18 of Set 12 | saint-pierre
Processing Record 19 of Set 12 | okhotsk
Processing Record 20 of Set 12 | sidi bu zayd
City not found. Skipping...sidi bu zayd569
Processing Record 21 of Set 12 | kankaanpaa
Processing Record 22 of Set 12 | noormarkku
Processing Record 23 of Set 12 | comodoro rivadavia
Processing Record 24 of Set 12 | junction city
Processing Record 25 of Set 12 | m

In [8]:
city_data

[{'City': 'Yellowknife',
  'Lat': 62.456,
  'Lng': -114.3525,
  'Max Temp': -11.99,
  'Humidity': 77,
  'Cloudiness': 20,
  'Wind Speed': 3.44,
  'Country': 'CA',
  'Date': '2021-01-31 01:41:44'},
 {'City': 'Rocha',
  'Lat': -34.4833,
  'Lng': -54.3333,
  'Max Temp': 65.26,
  'Humidity': 89,
  'Cloudiness': 100,
  'Wind Speed': 14.94,
  'Country': 'UY',
  'Date': '2021-01-31 01:41:44'},
 {'City': 'Marzuq',
  'Lat': 14.4,
  'Lng': 46.4667,
  'Max Temp': 57.04,
  'Humidity': 61,
  'Cloudiness': 0,
  'Wind Speed': 2.8,
  'Country': 'YE',
  'Date': '2021-01-31 01:38:35'},
 {'City': 'Port Alfred',
  'Lat': -33.5906,
  'Lng': 26.891,
  'Max Temp': 63,
  'Humidity': 92,
  'Cloudiness': 0,
  'Wind Speed': 1.97,
  'Country': 'ZA',
  'Date': '2021-01-31 01:41:45'},
 {'City': 'Tebingtinggi',
  'Lat': 3.3285,
  'Lng': 99.1625,
  'Max Temp': 77,
  'Humidity': 100,
  'Cloudiness': 40,
  'Wind Speed': 3.44,
  'Country': 'ID',
  'Date': '2021-01-31 01:41:45'},
 {'City': 'Hobart',
  'Lat': -42.8794,
  

In [9]:
city_data[0]

{'City': 'Yellowknife',
 'Lat': 62.456,
 'Lng': -114.3525,
 'Max Temp': -11.99,
 'Humidity': 77,
 'Cloudiness': 20,
 'Wind Speed': 3.44,
 'Country': 'CA',
 'Date': '2021-01-31 01:41:44'}

In [10]:
city_weather

{'coord': {'lon': -40.2925, 'lat': -20.3297},
 'weather': [{'id': 803,
   'main': 'Clouds',
   'description': 'broken clouds',
   'icon': '04n'}],
 'base': 'stations',
 'main': {'temp': 78.39,
  'feels_like': 82.62,
  'temp_min': 78.01,
  'temp_max': 78.8,
  'pressure': 1016,
  'humidity': 78},
 'visibility': 10000,
 'wind': {'speed': 6.91, 'deg': 360},
 'clouds': {'all': 75},
 'dt': 1612057413,
 'sys': {'type': 1,
  'id': 8474,
  'country': 'BR',
  'sunrise': 1611995024,
  'sunset': 1612041907},
 'timezone': -10800,
 'id': 3445026,
 'name': 'Vila Velha',
 'cod': 200}

In [11]:
len(city_data)

557

In [12]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Yellowknife,62.456,-114.3525,-11.99,77,20,3.44,CA,2021-01-31 01:41:44
1,Rocha,-34.4833,-54.3333,65.26,89,100,14.94,UY,2021-01-31 01:41:44
2,Marzuq,14.4,46.4667,57.04,61,0,2.8,YE,2021-01-31 01:38:35
3,Port Alfred,-33.5906,26.891,63.0,92,0,1.97,ZA,2021-01-31 01:41:45
4,Tebingtinggi,3.3285,99.1625,77.0,100,40,3.44,ID,2021-01-31 01:41:45
5,Hobart,-42.8794,147.3294,75.0,45,40,11.5,AU,2021-01-31 01:37:21
6,Beringovskiy,63.05,179.3167,6.33,94,100,30.67,RU,2021-01-31 01:41:46
7,Atuona,-9.8,-139.0333,79.07,75,44,17.13,PF,2021-01-31 01:41:46
8,Buraydah,26.326,43.975,46.4,76,0,5.75,SA,2021-01-31 01:41:51
9,Ushuaia,-54.8,-68.3,50.0,66,20,24.16,AR,2021-01-31 01:41:51


In [15]:
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]

In [16]:
city_data_df = city_data_df[new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Yellowknife,CA,2021-01-31 01:41:44,62.4560,-114.3525,-11.99,77,20,3.44
1,Rocha,UY,2021-01-31 01:41:44,-34.4833,-54.3333,65.26,89,100,14.94
2,Marzuq,YE,2021-01-31 01:38:35,14.4000,46.4667,57.04,61,0,2.80
3,Port Alfred,ZA,2021-01-31 01:41:45,-33.5906,26.8910,63.00,92,0,1.97
4,Tebingtinggi,ID,2021-01-31 01:41:45,3.3285,99.1625,77.00,100,40,3.44
...,...,...,...,...,...,...,...,...,...
552,Port Augusta,AU,2021-01-31 01:43:32,-32.5000,137.7667,71.60,60,100,14.97
553,Ulaanbaatar,MN,2021-01-31 01:41:52,47.9077,106.8832,1.40,71,40,15.66
554,Imamoglu,TR,2021-01-31 01:43:33,37.2651,35.6572,48.99,100,75,13.80
555,Port-Cartier,CA,2021-01-31 01:43:33,50.0334,-66.8654,19.40,63,9,9.22


In [17]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")