In [1]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [2]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1f81cc16440>

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [4]:
coordinates

[(87.19363570617972, 37.912856387645974),
 (72.86227133201882, -114.37713213325904),
 (52.25105443067693, -172.86694142759234),
 (-69.41067270874288, 25.43508675252434),
 (-0.982091179494347, -13.35547890837995),
 (88.69825856525983, -17.388623299480116),
 (57.583002786865706, 23.66060257134066),
 (-72.88533327729681, -21.19326229616709),
 (-86.92299593208666, 8.557309822158714),
 (-49.903652636590934, -117.193877603006),
 (-30.94135095641615, 61.12059648849569),
 (-52.667597546163556, 139.75921175341438),
 (56.63056437941418, -95.48981651916691),
 (-50.072073865355826, -163.99022352538415),
 (73.17737468868307, -141.85442742257231),
 (-52.02375023254863, -34.52147768740656),
 (54.59509261359483, -94.05219441034762),
 (-74.61028900742569, -112.35342532289339),
 (13.155956401594366, -108.33026945831637),
 (-65.1234671636718, 39.06864956265082),
 (-78.37309023281117, -156.58180083875428),
 (-46.54093467197515, -113.29782592272184),
 (34.3336091398579, -84.56401006374787),
 (-20.000217279

In [5]:
pip install citipy

Note: you may need to restart the kernel to use updated packages.


In [6]:
from citipy import citipy

In [7]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

588

In [8]:
cities

['vardo',
 'yellowknife',
 'provideniya',
 'bredasdorp',
 'georgetown',
 'illoqqortoormiut',
 'jurmala',
 'mar del plata',
 'hermanus',
 'rikitea',
 'saint-philippe',
 'new norfolk',
 'thompson',
 'avarua',
 'aklavik',
 'chuy',
 'punta arenas',
 'san patricio',
 'port alfred',
 'mataura',
 'canton',
 'puerto ayora',
 'nizhneyansk',
 'hobyo',
 'busselton',
 'tiksi',
 'lima',
 'albany',
 'adrar',
 'yerbogachen',
 'samarai',
 'hilo',
 'ushuaia',
 'kapaa',
 'hamilton',
 'mizque',
 'hobart',
 'flinders',
 'saskylakh',
 'arraial do cabo',
 'ust-tsilma',
 'saint-augustin',
 'port elizabeth',
 'tynda',
 'san isidro',
 'cape town',
 'ketchikan',
 'solnechnyy',
 'beloha',
 'umzimvubu',
 'bilibino',
 'burgersdorp',
 'qaanaaq',
 'byron bay',
 'umuahia',
 'butaritari',
 'carnarvon',
 'lebu',
 'verkhnevilyuysk',
 'ivanteyevka',
 'severo-kurilsk',
 'oshkosh',
 'vaitupu',
 'ostrovnoy',
 'quatre cocos',
 'kodiak',
 'codrington',
 'chokurdakh',
 'santa rosa',
 'san rafael',
 'narsaq',
 'surt',
 'bambous

In [9]:
import requests


In [10]:
conda install -c conda-forge requests

Collecting package metadata (current_repodata.json): ...working... done
Solving environment: ...working... done

# All requested packages already installed.


Note: you may need to restart the kernel to use updated packages.


In [11]:
# Import the API key.
from config import weather_api_key

In [12]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=4d5ea3cb53e6ed4c59cc0e64aea22fc0


In [13]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [14]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")
    
    

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | vardo
Processing Record 2 of Set 1 | yellowknife
Processing Record 3 of Set 1 | provideniya
Processing Record 4 of Set 1 | bredasdorp
Processing Record 5 of Set 1 | georgetown
Processing Record 6 of Set 1 | illoqqortoormiut
City not found. Skipping...
Processing Record 7 of Set 1 | jurmala
Processing Record 8 of Set 1 | mar del plata
Processing Record 9 of Set 1 | hermanus
Processing Record 10 of Set 1 | rikitea
Processing Record 11 of Set 1 | saint-philippe
Processing Record 12 of Set 1 | new norfolk
Processing Record 13 of Set 1 | thompson
Processing Record 14 of Set 1 | avarua
Processing Record 15 of Set 1 | aklavik
Processing Record 16 of Set 1 | chuy
Processing Record 17 of Set 1 | punta arenas
Processing Record 18 of Set 1 | san patricio
Processing Record 19 of Set 1 | port alfred
Processing Record 20 of Set 1 | mataura
Processing Record 21 of Set 1 | canton
Processing Record 22 of Set 1 | 

Processing Record 39 of Set 4 | la asuncion
Processing Record 40 of Set 4 | apac
Processing Record 41 of Set 4 | mys shmidta
City not found. Skipping...
Processing Record 42 of Set 4 | kaitangata
Processing Record 43 of Set 4 | hurricane
Processing Record 44 of Set 4 | qasigiannguit
Processing Record 45 of Set 4 | komsomolskiy
Processing Record 46 of Set 4 | namibe
Processing Record 47 of Set 4 | baturaja
Processing Record 48 of Set 4 | vao
Processing Record 49 of Set 4 | labuan
Processing Record 50 of Set 4 | pareora
Processing Record 1 of Set 5 | tromso
Processing Record 2 of Set 5 | libenge
Processing Record 3 of Set 5 | klaksvik
Processing Record 4 of Set 5 | marrakesh
Processing Record 5 of Set 5 | hays
Processing Record 6 of Set 5 | humaita
Processing Record 7 of Set 5 | magdagachi
Processing Record 8 of Set 5 | harper
Processing Record 9 of Set 5 | malanje
Processing Record 10 of Set 5 | namie
Processing Record 11 of Set 5 | pokaran
Processing Record 12 of Set 5 | balaipungut
Pr

Processing Record 31 of Set 8 | gawler
Processing Record 32 of Set 8 | morro bay
Processing Record 33 of Set 8 | johnson city
Processing Record 34 of Set 8 | chicama
Processing Record 35 of Set 8 | chiavari
Processing Record 36 of Set 8 | nouadhibou
Processing Record 37 of Set 8 | ginda
Processing Record 38 of Set 8 | katsuura
Processing Record 39 of Set 8 | scarborough
Processing Record 40 of Set 8 | halifax
Processing Record 41 of Set 8 | santa isabel do rio negro
Processing Record 42 of Set 8 | klyuchi
Processing Record 43 of Set 8 | slave lake
Processing Record 44 of Set 8 | smithers
Processing Record 45 of Set 8 | abonnema
Processing Record 46 of Set 8 | killybegs
Processing Record 47 of Set 8 | narasapur
Processing Record 48 of Set 8 | walvis bay
Processing Record 49 of Set 8 | tuy hoa
Processing Record 50 of Set 8 | praia
Processing Record 1 of Set 9 | chara
Processing Record 2 of Set 9 | hirara
Processing Record 3 of Set 9 | mae sot
Processing Record 4 of Set 9 | resistencia
Pr

Processing Record 21 of Set 12 | tunduru
City not found. Skipping...
Processing Record 22 of Set 12 | dumas
Processing Record 23 of Set 12 | palauig
Processing Record 24 of Set 12 | ambovombe
Processing Record 25 of Set 12 | cortez
Processing Record 26 of Set 12 | stekolnyy
City not found. Skipping...
Processing Record 27 of Set 12 | marquette
Processing Record 28 of Set 12 | mount gambier
Processing Record 29 of Set 12 | naryan-mar
Processing Record 30 of Set 12 | oktyabrskoye
Processing Record 31 of Set 12 | jinchang
Processing Record 32 of Set 12 | jinka
Processing Record 33 of Set 12 | itoman
Processing Record 34 of Set 12 | akdepe
Processing Record 35 of Set 12 | afgoye
City not found. Skipping...
Processing Record 36 of Set 12 | maralal
Processing Record 37 of Set 12 | totma
Processing Record 38 of Set 12 | port blair
-----------------------------
Data Retrieval Complete      
-----------------------------


In [15]:
len(city_data)

546

In [21]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Vardo,70.3705,31.1107,33.8,80,75,23.02,NO,2021-02-17 21:13:39
1,Yellowknife,62.456,-114.3525,-13.0,76,90,4.61,CA,2021-02-17 21:13:27
2,Provideniya,64.3833,-173.3,1.4,60,0,26.84,RU,2021-02-17 21:13:25
3,Bredasdorp,-34.5322,20.0403,62.6,82,75,5.75,ZA,2021-02-17 21:13:30
4,Georgetown,5.4112,100.3354,78.8,69,20,6.91,MY,2021-02-17 21:11:06
5,Jurmala,56.968,23.7704,6.8,85,0,3.44,LV,2021-02-17 21:15:09
6,Mar Del Plata,-38.0023,-57.5575,69.8,73,40,10.36,AR,2021-02-17 21:09:12
7,Hermanus,-34.4187,19.2345,66.99,83,69,1.99,ZA,2021-02-17 21:13:25
8,Rikitea,-23.1203,-134.9692,78.6,70,12,11.27,PF,2021-02-17 21:13:22
9,Saint-Philippe,-21.3585,55.7679,78.8,73,0,5.75,RE,2021-02-17 21:13:30


In [24]:
new_column_order = ["City","Country","Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]

In [25]:
city_data_df = city_data_df[new_column_order]

In [26]:
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Vardo,NO,2021-02-17 21:13:39,70.3705,31.1107,33.8,80,75,23.02
1,Yellowknife,CA,2021-02-17 21:13:27,62.456,-114.3525,-13.0,76,90,4.61
2,Provideniya,RU,2021-02-17 21:13:25,64.3833,-173.3,1.4,60,0,26.84
3,Bredasdorp,ZA,2021-02-17 21:13:30,-34.5322,20.0403,62.6,82,75,5.75
4,Georgetown,MY,2021-02-17 21:11:06,5.4112,100.3354,78.8,69,20,6.91


In [27]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")