In [1]:
# Import the dependencies
# Standard library: datetime/timezone for UTC timestamps, Path for output folders
from datetime import datetime, timezone
from pathlib import Path

# Third-party libraries
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
# Import the requests library
import requests
from citipy import citipy

# Import the API key
from config import weather_api_key

# Base endpoint for current-weather lookups (Imperial units).
# HTTPS is used because the API key travels in the query string and would
# otherwise be sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [2]:
# Create a reproducible set of random latitude and longitude combinations.
# A fixed seed makes Restart & Run All draw the same coordinates every time;
# change COORD_SEED to draw a different sample.
COORD_SEED = 42
COORD_COUNT = 1800
rng = np.random.default_rng(COORD_SEED)
lats = rng.uniform(low=-90.000, high=90.000, size=COORD_COUNT)
lngs = rng.uniform(low=-180.000, high=180.000, size=COORD_COUNT)
# zip() returns a one-shot iterator: it is empty after its first full pass.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7ffc199faa50>

In [3]:
# Add the latitudes and longitudes to a list.
# The pairs are rebuilt from the arrays instead of draining the one-shot
# `lat_lngs` iterator, so re-running this cell never produces an empty list.
coordinates = list(zip(lats, lngs))


In [4]:
# Identify the nearest city for each latitude and longitude combination.
nearest_city_names = (
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
)

# Keep each city once, in first-seen order. dict.fromkeys de-duplicates with
# hash lookups instead of rescanning the growing list for every coordinate.
cities = list(dict.fromkeys(nearest_city_names))

# Print the city count to confirm sufficient count
len(cities)

720

In [5]:
# Create an empty list to hold the weather data
city_data = []
# Seconds to wait for the API before giving up on a city, so a single stalled
# connection cannot hang the whole retrieval loop.
REQUEST_TIMEOUT = 10

# Print the beginning of the logging
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters: records restart at 1 in every set of 50 cities.
record_count = 1
set_count = 1
# Loop through all the cities in the list
for i, city in enumerate(cities):
    # Group cities in sets of 50 for logging purposes
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1
    # Create the endpoint URL for this city; spaces in the name become "+".
    city_url = url + "&q=" + city.replace(" ", "+")

    # Log the record and set numbers and the city.
    # NOTE: the format is kept byte-for-byte so it matches the recorded output.
    print(f"Processing Record {record_count} of Set {set_count})|{city}")
    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url, timeout=REQUEST_TIMEOUT).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to an ISO-style UTC string.
        # A timezone-aware conversion replaces the deprecated utcfromtimestamp.
        city_date = datetime.fromtimestamp(
            city_weather["dt"], tz=timezone.utc
        ).strftime('%Y-%m-%d %H:%M:%S')
    except (requests.exceptions.RequestException, ValueError) as err:
        # Network failure, timeout, or a body that is not valid JSON.
        # Only the exception type is logged: the message can embed the request
        # URL, which contains the API key.
        print(f"Request failed ({type(err).__name__}). Skipping...")
    except KeyError:
        # The response lacks the expected fields, as it does when the API
        # has no match for the city name. Skip the city.
        print("City not found. Skipping...")
    else:
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1)|okhotsk
Processing Record 2 of Set 1)|hithadhoo
Processing Record 3 of Set 1)|atuona
Processing Record 4 of Set 1)|saleaula
City not found. Skipping...
Processing Record 5 of Set 1)|taolanaro
City not found. Skipping...
Processing Record 6 of Set 1)|nador
Processing Record 7 of Set 1)|keuruu
Processing Record 8 of Set 1)|georgetown
Processing Record 9 of Set 1)|qaanaaq
Processing Record 10 of Set 1)|punta arenas
Processing Record 11 of Set 1)|butaritari
Processing Record 12 of Set 1)|ahuimanu
Processing Record 13 of Set 1)|albany
Processing Record 14 of Set 1)|vestmannaeyjar
Processing Record 15 of Set 1)|jasper
Processing Record 16 of Set 1)|hrusovany nad jevisovkou
Processing Record 17 of Set 1)|huntsville
Processing Record 18 of Set 1)|hermanus
Processing Record 19 of Set 1)|ushuaia
Processing Record 20 of Set 1)|lebu
Processing Record 21 of Set 1)|yulara
Processing Record 22 of Set 1)|jamestow

Processing Record 43 of Set 4)|itaituba
Processing Record 44 of Set 4)|hamilton
Processing Record 45 of Set 4)|esperance
Processing Record 46 of Set 4)|lavrentiya
Processing Record 47 of Set 4)|pandan
Processing Record 48 of Set 4)|illoqqortoormiut
City not found. Skipping...
Processing Record 49 of Set 4)|manicore
Processing Record 50 of Set 4)|huadian
Processing Record 1 of Set 5)|havre
Processing Record 2 of Set 5)|provideniya
Processing Record 3 of Set 5)|loikaw
Processing Record 4 of Set 5)|hadejia
Processing Record 5 of Set 5)|palembang
Processing Record 6 of Set 5)|belushya guba
City not found. Skipping...
Processing Record 7 of Set 5)|ariguani
Processing Record 8 of Set 5)|kaoma
Processing Record 9 of Set 5)|kaeo
Processing Record 10 of Set 5)|vostok
Processing Record 11 of Set 5)|igarka
Processing Record 12 of Set 5)|tripoli
Processing Record 13 of Set 5)|husavik
Processing Record 14 of Set 5)|dikson
Processing Record 15 of Set 5)|kinkala
Processing Record 16 of Set 5)|sandnes

Processing Record 41 of Set 8)|taltal
Processing Record 42 of Set 8)|felanitx
Processing Record 43 of Set 8)|rodino
Processing Record 44 of Set 8)|kargil
Processing Record 45 of Set 8)|pangkalanbuun
Processing Record 46 of Set 8)|paamiut
Processing Record 47 of Set 8)|okha
Processing Record 48 of Set 8)|lopez jaena
Processing Record 49 of Set 8)|coxim
Processing Record 50 of Set 8)|wagar
Processing Record 1 of Set 9)|aykhal
Processing Record 2 of Set 9)|rungata
City not found. Skipping...
Processing Record 3 of Set 9)|bima
Processing Record 4 of Set 9)|traralgon
Processing Record 5 of Set 9)|severodvinsk
Processing Record 6 of Set 9)|sangar
Processing Record 7 of Set 9)|hasaki
Processing Record 8 of Set 9)|samalaeulu
City not found. Skipping...
Processing Record 9 of Set 9)|morros
Processing Record 10 of Set 9)|sola
Processing Record 11 of Set 9)|omboue
Processing Record 12 of Set 9)|kibungo
Processing Record 13 of Set 9)|rafaela
Processing Record 14 of Set 9)|malwan
City not found. Sk

Processing Record 35 of Set 12)|port macquarie
Processing Record 36 of Set 12)|san andres
Processing Record 37 of Set 12)|sistranda
Processing Record 38 of Set 12)|ode
Processing Record 39 of Set 12)|khani
Processing Record 40 of Set 12)|kargasok
Processing Record 41 of Set 12)|manzil tamim
City not found. Skipping...
Processing Record 42 of Set 12)|suifenhe
Processing Record 43 of Set 12)|abu dhabi
Processing Record 44 of Set 12)|pyaozerskiy
Processing Record 45 of Set 12)|oda
Processing Record 46 of Set 12)|pundaguitan
Processing Record 47 of Set 12)|hudson bay
Processing Record 48 of Set 12)|cagayan de tawi-tawi
City not found. Skipping...
Processing Record 49 of Set 12)|dingle
Processing Record 50 of Set 12)|uusikaupunki
Processing Record 1 of Set 13)|timra
Processing Record 2 of Set 13)|nova olimpia
Processing Record 3 of Set 13)|pueblo nuevo
Processing Record 4 of Set 13)|doctor pedro p. pena
City not found. Skipping...
Processing Record 5 of Set 13)|road town
Processing Record 6

In [6]:
# Count the cities whose weather record was parsed and stored in city_data.
len(city_data)

672

In [7]:
# Build a DataFrame from the collected records (one dictionary per city).
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Okhotsk,59.3833,143.3,7.48,92,64,5.97,RU,2021-04-02 17:12:39
1,Hithadhoo,-0.6,73.0833,83.73,77,24,20.09,MV,2021-04-02 17:12:39
2,Atuona,-9.8,-139.0333,80.82,78,81,13.94,PF,2021-04-02 17:12:40
3,Nador,35.174,-2.9287,68.0,52,20,13.8,MA,2021-04-02 17:12:40
4,Keuruu,62.2667,24.7,37.99,75,0,4.61,FI,2021-04-02 17:12:41
5,Georgetown,5.4112,100.3354,84.2,89,40,4.61,MY,2021-04-02 17:09:03
6,Qaanaaq,77.484,-69.3632,-11.25,75,100,12.91,GL,2021-04-02 17:12:41
7,Punta Arenas,-53.15,-70.9167,50.0,62,0,14.97,CL,2021-04-02 17:10:55
8,Butaritari,3.0707,172.7902,81.18,81,22,17.63,KI,2021-04-02 17:12:41
9,Ahuimanu,21.4447,-157.8378,71.6,73,20,6.91,US,2021-04-02 17:12:42


In [8]:
# Reorder the columns: identifying fields first, then position, then measurements.
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df.loc[:, new_column_order]
# Preview the first five rows in the new column order.
city_data_df.head(5)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Okhotsk,RU,2021-04-02 17:12:39,59.3833,143.3,7.48,92,64,5.97
1,Hithadhoo,MV,2021-04-02 17:12:39,-0.6,73.0833,83.73,77,24,20.09
2,Atuona,PF,2021-04-02 17:12:40,-9.8,-139.0333,80.82,78,81,13.94
3,Nador,MA,2021-04-02 17:12:40,35.174,-2.9287,68.0,52,20,13.8
4,Keuruu,FI,2021-04-02 17:12:41,62.2667,24.7,37.99,75,0,4.61


In [11]:
# Create the output file (CSV)
output_data_file = "weather_data/cities.csv"
# to_csv does not create missing folders, so make sure the target directory
# exists before writing (a no-op when it is already there).
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")