In [1]:
# Import the dependencies.
import os
import time
from datetime import datetime

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy

from config import weatherkey

In [2]:
# Starting URL for the OpenWeatherMap API call.
# The API key is appended as a query parameter, so use HTTPS to avoid sending
# it over the network in plaintext.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weatherkey

In [3]:
# Accumulator for one weather record (dict) per successfully retrieved city.
city_data = []

# Announce the start of the retrieval log (banner text followed by a rule).
print("Beginning Data Retrieval     ", "-----------------------------", sep="\n")

# Logging counters: position within the current set, and the set number.
record_count = set_count = 1

Beginning Data Retrieval     
-----------------------------


In [4]:
# Draw random latitude and longitude combinations, sampled uniformly over
# [-90, 90) for latitude and [-180, 180) for longitude.
n_points = 1500
lats = np.random.uniform(-90.000, 90.000, n_points)
lngs = np.random.uniform(-180.000, 180.000, n_points)

# Pair each latitude with the longitude at the same position.
# Note: zip() returns a one-shot iterator, so displaying it only shows its repr.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x2bfbebc7dc8>

In [5]:
# Add the latitudes and longitudes to a list.
# Build the pairs directly from the arrays rather than from the `lat_lngs`
# iterator: a zip object can be consumed only once, so re-running this cell
# against it would silently produce an empty list.
coordinates = list(zip(lats, lngs))

In [6]:
# Create a list for holding the cities (unique names, in first-seen order).
cities = []
# Companion set so the uniqueness check is a constant-time lookup instead of a
# scan of the whole list on every iteration.
seen_cities = set()

# Identify the nearest city for each latitude and longitude combination.
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count.
len(cities)

611

In [7]:
# Retrieve the current weather for every city in `cities` and collect one
# record (dict) per successful response in `city_data`.

# Reset the accumulators so that re-running this cell on its own starts from a
# clean slate instead of appending duplicate rows and continuing old numbering.
city_data = []
record_count = 1
set_count = 1

# Loop through all the cities in our list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        # Pause for a minute between sets -- presumably to stay under the API's
        # per-minute request limit (TODO confirm against the account's plan).
        time.sleep(60)

    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ", "+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data. The timeout keeps a stalled
        # connection from hanging the whole cell indefinitely.
        city_weather = requests.get(city_url, timeout=10).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If an error is experienced, skip the city. Only the expected failures are
    # caught: network/HTTP problems, a body that is not valid JSON, and a
    # payload missing the fields read above. A bare `except:` would also
    # swallow KeyboardInterrupt and hide genuine programming errors.
    except (requests.exceptions.RequestException, KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | severo-kurilsk
Processing Record 2 of Set 1 | ribeira grande
Processing Record 3 of Set 1 | mayo
Processing Record 4 of Set 1 | mount isa
Processing Record 5 of Set 1 | port elizabeth
Processing Record 6 of Set 1 | mataura
Processing Record 7 of Set 1 | puerto ayora
Processing Record 8 of Set 1 | cape town
Processing Record 9 of Set 1 | hobart
Processing Record 10 of Set 1 | hithadhoo
Processing Record 11 of Set 1 | albany
Processing Record 12 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 13 of Set 1 | itigi
Processing Record 14 of Set 1 | cururupu
Processing Record 15 of Set 1 | tsihombe
City not found. Skipping...
Processing Record 16 of Set 1 | provideniya
Processing Record 17 of Set 1 | thompson
Processing Record 18 of Set 1 | hermanus
Processing Record 19 of Set 1 | kaitangata
Processing Record 20 of Set 1 | puerto del rosario
Processing Record 21 of Set 1 | rikitea
Processing Record 22 of Set 1 | bluff
Processing Record 23 of Se

City not found. Skipping...
Processing Record 38 of Set 4 | hamilton
Processing Record 39 of Set 4 | sao joao da barra
Processing Record 40 of Set 4 | klaksvik
Processing Record 41 of Set 4 | bure
Processing Record 42 of Set 4 | kalmunai
Processing Record 43 of Set 4 | fairbanks
Processing Record 44 of Set 4 | ponta do sol
Processing Record 45 of Set 4 | puerto escondido
Processing Record 46 of Set 4 | beihai
Processing Record 47 of Set 4 | sitka
Processing Record 48 of Set 4 | avera
Processing Record 49 of Set 4 | khatanga
Processing Record 50 of Set 4 | montrose
Processing Record 1 of Set 5 | coahuayana
Processing Record 2 of Set 5 | luganville
Processing Record 3 of Set 5 | dayong
Processing Record 4 of Set 5 | hovd
Processing Record 5 of Set 5 | waipawa
Processing Record 6 of Set 5 | san fernando
Processing Record 7 of Set 5 | saint george
Processing Record 8 of Set 5 | east london
Processing Record 9 of Set 5 | grand gaube
Processing Record 10 of Set 5 | antsohihy
Processing Recor

Processing Record 31 of Set 8 | codrington
Processing Record 32 of Set 8 | corinto
Processing Record 33 of Set 8 | yulara
Processing Record 34 of Set 8 | kitgum
Processing Record 35 of Set 8 | kovdor
Processing Record 36 of Set 8 | kupino
Processing Record 37 of Set 8 | blagoyevo
Processing Record 38 of Set 8 | achalpur
Processing Record 39 of Set 8 | tazovskiy
Processing Record 40 of Set 8 | mount gambier
Processing Record 41 of Set 8 | maroantsetra
Processing Record 42 of Set 8 | saleaula
City not found. Skipping...
Processing Record 43 of Set 8 | brunsbuttel
Processing Record 44 of Set 8 | troitsko-pechorsk
Processing Record 45 of Set 8 | road town
Processing Record 46 of Set 8 | riyadh
Processing Record 47 of Set 8 | kaeo
Processing Record 48 of Set 8 | srednekolymsk
Processing Record 49 of Set 8 | kollam
Processing Record 50 of Set 8 | eyl
Processing Record 1 of Set 9 | upata
Processing Record 2 of Set 9 | linhares
Processing Record 3 of Set 9 | pemangkat
Processing Record 4 of Se

Processing Record 18 of Set 12 | riohacha
Processing Record 19 of Set 12 | taupo
Processing Record 20 of Set 12 | angra
City not found. Skipping...
Processing Record 21 of Set 12 | la asuncion
Processing Record 22 of Set 12 | buala
Processing Record 23 of Set 12 | sorvag
City not found. Skipping...
Processing Record 24 of Set 12 | manoel urbano
Processing Record 25 of Set 12 | san jose
Processing Record 26 of Set 12 | xichang
Processing Record 27 of Set 12 | walvis bay
Processing Record 28 of Set 12 | carroll
Processing Record 29 of Set 12 | saint-francois
Processing Record 30 of Set 12 | angangxi
City not found. Skipping...
Processing Record 31 of Set 12 | thunder bay
Processing Record 32 of Set 12 | north adams
Processing Record 33 of Set 12 | vilyuysk
Processing Record 34 of Set 12 | erzin
Processing Record 35 of Set 12 | shache
Processing Record 36 of Set 12 | sayyan
Processing Record 37 of Set 12 | palabuhanratu
City not found. Skipping...
Processing Record 38 of Set 12 | chacalti

In [17]:
# Build a Pandas DataFrame from the list of per-city dictionaries
# (one row per dictionary, one column per key).
output_city_data_df = pd.DataFrame(data=city_data)

# Preview the first ten rows.
output_city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Severo-Kurilsk,50.6789,156.125,26.38,55,45,5.75,RU,2022-01-26 01:24:46
1,Ribeira Grande,38.5167,-28.7,59.68,79,100,6.98,PT,2022-01-26 01:24:46
2,Mayo,38.8876,-76.5119,35.71,55,100,7.0,US,2022-01-26 01:24:18
3,Mount Isa,-20.7333,139.5,85.77,66,75,12.66,AU,2022-01-26 01:24:47
4,Port Elizabeth,-33.918,25.5701,70.11,83,100,10.36,ZA,2022-01-26 01:22:36
5,Mataura,-46.1927,168.8643,55.47,96,100,3.4,NZ,2022-01-26 01:24:47
6,Puerto Ayora,-0.7393,-90.3518,73.87,88,76,6.35,EC,2022-01-26 01:24:48
7,Cape Town,-33.9258,18.4232,68.41,79,0,5.99,ZA,2022-01-26 01:24:00
8,Hobart,-42.8794,147.3294,67.01,73,75,8.05,AU,2022-01-26 01:24:48
9,Hithadhoo,-0.6,73.0833,81.1,67,100,17.94,MV,2022-01-26 01:24:48


In [18]:
# Rearrange columns.
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
# Derive the reordered frame from `output_city_data_df` (the frame built from
# `city_data`). Reading `city_data_df` here would fail on a fresh kernel because
# nothing has defined it yet, and a self-assignment would not be re-runnable.
city_data_df = output_city_data_df[new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Severo-Kurilsk,RU,2022-01-26 01:24:46,50.6789,156.1250,26.38,55,45,5.75
1,Ribeira Grande,PT,2022-01-26 01:24:46,38.5167,-28.7000,59.68,79,100,6.98
2,Mayo,US,2022-01-26 01:24:18,38.8876,-76.5119,35.71,55,100,7.00
3,Mount Isa,AU,2022-01-26 01:24:47,-20.7333,139.5000,85.77,66,75,12.66
4,Port Elizabeth,ZA,2022-01-26 01:22:36,-33.9180,25.5701,70.11,83,100,10.36
...,...,...,...,...,...,...,...,...,...
558,Mezen,RU,2022-01-26 01:40:15,65.8522,44.2400,7.65,98,30,5.75
559,Komsomolskiy,UZ,2022-01-26 01:40:16,40.4272,71.7189,29.62,80,75,6.91
560,Constitucion,CL,2022-01-26 01:40:16,-35.3333,-72.4167,56.46,93,2,8.01
561,Touros,BR,2022-01-26 01:40:16,-5.1989,-35.4608,81.50,76,100,13.51


In [19]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the destination folder exists first: to_csv does not create missing
# directories, and failing here would waste the whole retrieval run.
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")