In [1]:
# Standard library: datetime handling and filesystem paths.
from datetime import datetime, timezone
from pathlib import Path

# Import the dependencies.
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

# Import the requests library.
import requests

# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

# Import the API key.
from config import weather_api_key

In [2]:
# Draw independent random latitudes and longitudes covering the whole globe.
sample_size = 1500
lats = np.random.uniform(-90.000, 90.000, sample_size)
lngs = np.random.uniform(-180.000, 180.000, sample_size)
# Pair them up lazily: zip() yields (lat, lng) tuples and can be consumed only once.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fd513af42c0>

In [3]:
# Collect every (latitude, longitude) pair from lat_lngs into a list.
coordinates = [(lat, lng) for lat, lng in lat_lngs]

In [4]:
# Display the nearest city name and country code for each coordinate pair.
for lat, lng in coordinates:
    # Resolve the city once per coordinate and reuse it for both printed
    # fields instead of repeating the identical lookup.
    nearest = citipy.nearest_city(lat, lng)
    print(nearest.city_name, nearest.country_code)

krasnoye ru
petropavlovsk-kamchatskiy ru
taolanaro mg
lucban ph
nikolskoye ru
puerto ayora ec
neiafu to
san patricio mx
atuona pf
faanui pf
vao nc
mar del plata ar
codrington ag
vestmannaeyjar is
bredasdorp za
pallasovka ru
quelimane mz
rikitea pf
belaya gora ru
codrington ag
hastings nz
ewa beach us
olafsvik is
hermanus za
mataura pf
ushuaia ar
arraial do cabo br
raudeberg no
adrar dz
yuncheng cn
eyl so
dikson ru
bluff nz
kaitangata nz
bulgan mn
rikitea pf
mantua cu
le port re
punta arenas cl
sao francisco do sul br
tsihombe mg
roma au
caravelas br
esperance au
hermanus za
ati td
clyde river ca
mataura pf
porangatu br
fairbanks us
bermeo es
fairbanks us
port alfred za
ushuaia ar
saint-philippe re
ushuaia ar
busselton au
rikitea pf
ushuaia ar
kununurra au
aasiaat gl
atuona pf
rikitea pf
alotau pg
bahia blanca ar
burica pa
butaritari ki
mataura pf
bethel us
tiksi ru
ilulissat gl
sayyan ye
punta arenas cl
carnarvon au
kautokeino no
bethel us
saskylakh ru
busselton au
bambanglipuro id
ush

In [5]:
# Create a list for holding the cities.
# Identify the nearest city for each latitude and longitude combination and
# keep each name only once. dict.fromkeys() removes repeats in a single pass
# while preserving first-seen order, avoiding a linear `in` scan of a list for
# every coordinate.
# NOTE(review): names are de-duplicated without their country code, so two
# different cities that share a name collapse into one entry — confirm this is
# acceptable for the analysis.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))
# Print the city count to confirm sufficient count.
len(cities)

619

In [6]:
# Starting URL for Weather Map API Call.
# HTTPS is used so the API key carried in the query string is not sent in
# cleartext over the network.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [None]:
# Seconds to wait on a single API call before giving up on that city.
REQUEST_TIMEOUT_SECONDS = 10
# Number of cities grouped under one "Set" in the progress log.
RECORDS_PER_SET = 50

# Create an empty list to hold the weather data.
city_data = []

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes; both counters are 1-based.
    set_count = i // RECORDS_PER_SET + 1
    record_count = i % RECORDS_PER_SET + 1

    # Log the record and set numbers and the city. The request URL is
    # deliberately not logged because it contains the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Run an API request for each of the cities.
    try:
        # Pass the city as a query parameter so requests URL-encodes it
        # (spaces and any other special characters), and bound the wait so a
        # stalled connection cannot hang the whole loop.
        response = requests.get(url, params={"q": city},
                                timeout=REQUEST_TIMEOUT_SECONDS)

        # An unknown city name is expected for some generated names; skip it.
        if response.status_code == 404:
            print("City not found. Skipping...")
            continue

        # Any other HTTP error (bad key, rate limit, server error) is raised
        # here so it is not misreported as a missing city.
        response.raise_for_status()

        # Parse the JSON and retrieve data.
        city_weather = response.json()

        # Convert the date to ISO standard (UTC).
        city_date = datetime.fromtimestamp(
            city_weather["dt"], tz=timezone.utc
        ).strftime('%Y-%m-%d %H:%M:%S')

        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_weather["coord"]["lat"],
                          "Lng": city_weather["coord"]["lon"],
                          "Max Temp": city_weather["main"]["temp_max"],
                          "Humidity": city_weather["main"]["humidity"],
                          "Cloudiness": city_weather["clouds"]["all"],
                          "Wind Speed": city_weather["wind"]["speed"],
                          "Country": city_weather["sys"]["country"],
                          "Date": city_date})

    # If a request error is experienced, skip the city. Only specific
    # exceptions are caught so that interrupting the kernel still stops the loop.
    except requests.exceptions.RequestException as error:
        # Report only the exception type: the full message can embed the
        # request URL, which would leak the API key into the notebook output.
        print(f"Request failed ({type(error).__name__}). Skipping...")
    # If the payload is missing an expected field or is malformed, skip the city.
    except (KeyError, TypeError, ValueError):
        print("Unexpected response format. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | krasnoye
Processing Record 2 of Set 1 | petropavlovsk-kamchatskiy
Processing Record 3 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 4 of Set 1 | lucban
Processing Record 5 of Set 1 | nikolskoye
Processing Record 6 of Set 1 | puerto ayora
Processing Record 7 of Set 1 | neiafu
Processing Record 8 of Set 1 | san patricio
Processing Record 9 of Set 1 | atuona
Processing Record 10 of Set 1 | faanui
Processing Record 11 of Set 1 | vao
Processing Record 12 of Set 1 | mar del plata
Processing Record 13 of Set 1 | codrington
Processing Record 14 of Set 1 | vestmannaeyjar
Processing Record 15 of Set 1 | bredasdorp
Processing Record 16 of Set 1 | pallasovka
Processing Record 17 of Set 1 | quelimane
Processing Record 18 of Set 1 | rikitea
Processing Record 19 of Set 1 | belaya gora
Processing Record 20 of Set 1 | hastings
Processing Record 21 of Set 1 | ewa beach
Processing Record 22 of 

In [None]:
# Show how many records the city_data list currently holds.
len(city_data)

In [None]:
# Build a DataFrame with one row per record in city_data,
# then preview its first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

In [None]:
# Desired left-to-right column layout for the city weather table.
new_order_city_data = [
    'City', 'Country', 'Date',
    'Lat', 'Lng',
    'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed',
]
# Select the columns in that order and rebind the result to city_data_df.
city_data_df = city_data_df.loc[:, new_order_city_data]

city_data_df.head(n=10)

In [None]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Make sure the destination folder exists first: to_csv() does not create
# missing directories and would otherwise raise on a fresh checkout.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)

# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")