In [5]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [6]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x11ae5db90>

In [8]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [9]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [10]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

621

In [11]:
cities

['barentsburg',
 'bluff',
 'padang',
 'severo-yeniseyskiy',
 'tommot',
 'hofn',
 'butaritari',
 'taolanaro',
 'puerto ayora',
 'yellowknife',
 'murray bridge',
 'wairoa',
 'anadyr',
 'hobart',
 'victoria',
 'saint-philippe',
 'katsuura',
 'maldonado',
 'mount isa',
 'safaga',
 'mitu',
 'atuona',
 'san cristobal',
 'omboue',
 'east london',
 'dhidhdhoo',
 'lorengau',
 'carnarvon',
 'rikitea',
 'palabuhanratu',
 'arraial do cabo',
 'castro',
 'hithadhoo',
 'bambous virieux',
 'ushuaia',
 'albany',
 'arlit',
 'busselton',
 'cape town',
 'iskateley',
 'georgetown',
 'port hawkesbury',
 'saskylakh',
 'abyek',
 'yagodnoye',
 'avarua',
 'ampanihy',
 'inhambane',
 'camocim',
 'talnakh',
 'vaitupu',
 'fortuna',
 'pogaceaua',
 'okhotsk',
 'lagoa',
 'nanortalik',
 'barabinsk',
 'illoqqortoormiut',
 'khatanga',
 'chuy',
 'punta arenas',
 'halifax',
 'vaini',
 'vao',
 'leh',
 'cherskiy',
 'amderma',
 'grand gaube',
 'neryungri',
 'bahia honda',
 'kaeo',
 'quatre cocos',
 'dwarka',
 'cameron park',


In [12]:
len(cities)

621

In [14]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [15]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=25d38e422a25052620a67beb790e3e5e


In [17]:
# Create an endpoint URL for a city.
city_url = url + "&q=" + "Boston"
city_weather = requests.get(city_url)
city_weather.json()

{'coord': {'lon': -71.0598, 'lat': 42.3584},
 'weather': [{'id': 804,
   'main': 'Clouds',
   'description': 'overcast clouds',
   'icon': '04n'}],
 'base': 'stations',
 'main': {'temp': 60.28,
  'feels_like': 60.1,
  'temp_min': 56.62,
  'temp_max': 63.43,
  'pressure': 1016,
  'humidity': 87},
 'visibility': 10000,
 'wind': {'speed': 1.01, 'deg': 92, 'gust': 8.01},
 'clouds': {'all': 90},
 'dt': 1633306583,
 'sys': {'type': 2,
  'id': 2013408,
  'country': 'US',
  'sunrise': 1633257816,
  'sunset': 1633299753},
 'timezone': -14400,
 'id': 4930956,
 'name': 'Boston',
 'cod': 200}

In [18]:
# Get the JSON data.
boston_data = city_weather.json()

In [19]:
lat = boston_data["coord"]["lat"]
lng = boston_data["coord"]["lon"]
max_temp = boston_data["main"]["temp_max"]
humidity = boston_data["main"]["humidity"]
clouds = boston_data["clouds"]["all"]
wind = boston_data["wind"]["speed"]
print(lat, lng, max_temp, humidity, clouds, wind)

42.3584 -71.0598 63.43 87 90 1.01


In [20]:
# Import the datetime module from the datetime library.
from datetime import datetime
# Get the date from the JSON file.
date = boston_data["dt"]
# Convert the UTC date to a date format with year, month, day, hours, minutes, and seconds.
datetime.utcfromtimestamp(date)

datetime.datetime(2021, 10, 4, 0, 16, 23)

In [21]:
# Import the datetime module from the datetime library.
from datetime import datetime


In [22]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | barentsburg
City not found. Skipping...
Processing Record 2 of Set 1 | bluff
Processing Record 3 of Set 1 | padang
Processing Record 4 of Set 1 | severo-yeniseyskiy
Processing Record 5 of Set 1 | tommot
Processing Record 6 of Set 1 | hofn
Processing Record 7 of Set 1 | butaritari
Processing Record 8 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 9 of Set 1 | puerto ayora
Processing Record 10 of Set 1 | yellowknife
Processing Record 11 of Set 1 | murray bridge
Processing Record 12 of Set 1 | wairoa
Processing Record 13 of Set 1 | anadyr
Processing Record 14 of Set 1 | hobart
Processing Record 15 of Set 1 | victoria
Processing Record 16 of Set 1 | saint-philippe
Processing Record 17 of Set 1 | katsuura
Processing Record 18 of Set 1 | maldonado
Processing Record 19 of Set 1 | mount isa
Processing Record 20 of Set 1 | safaga
Processing Record 21 of Set 1 | mitu
Processing Record 2

Processing Record 39 of Set 4 | prainha
Processing Record 40 of Set 4 | hibbing
Processing Record 41 of Set 4 | phan rang
City not found. Skipping...
Processing Record 42 of Set 4 | benguela
Processing Record 43 of Set 4 | las palmas
Processing Record 44 of Set 4 | vaasa
Processing Record 45 of Set 4 | tabou
Processing Record 46 of Set 4 | san patricio
Processing Record 47 of Set 4 | pangnirtung
Processing Record 48 of Set 4 | belushya guba
City not found. Skipping...
Processing Record 49 of Set 4 | hilo
Processing Record 50 of Set 4 | longyearbyen
Processing Record 1 of Set 5 | irondequoit
Processing Record 2 of Set 5 | seoul
Processing Record 3 of Set 5 | axim
Processing Record 4 of Set 5 | severo-kurilsk
Processing Record 5 of Set 5 | manzhouli
Processing Record 6 of Set 5 | nizhneyansk
City not found. Skipping...
Processing Record 7 of Set 5 | hamilton
Processing Record 8 of Set 5 | nemuro
Processing Record 9 of Set 5 | bontang
Processing Record 10 of Set 5 | new norfolk
Processing

Processing Record 26 of Set 8 | matay
Processing Record 27 of Set 8 | loubomo
Processing Record 28 of Set 8 | latehar
Processing Record 29 of Set 8 | raga
Processing Record 30 of Set 8 | sabha
Processing Record 31 of Set 8 | aksarka
Processing Record 32 of Set 8 | raglan
Processing Record 33 of Set 8 | snasa
Processing Record 34 of Set 8 | el alto
Processing Record 35 of Set 8 | hong gai
Processing Record 36 of Set 8 | brae
Processing Record 37 of Set 8 | aransas pass
Processing Record 38 of Set 8 | maragogi
Processing Record 39 of Set 8 | gat
Processing Record 40 of Set 8 | kalikino
Processing Record 41 of Set 8 | batemans bay
Processing Record 42 of Set 8 | owando
Processing Record 43 of Set 8 | coahuayana
Processing Record 44 of Set 8 | necochea
Processing Record 45 of Set 8 | baykit
Processing Record 46 of Set 8 | bengkulu
Processing Record 47 of Set 8 | iraucuba
Processing Record 48 of Set 8 | cardston
Processing Record 49 of Set 8 | kualakapuas
Processing Record 50 of Set 8 | hai

Processing Record 16 of Set 12 | korem
Processing Record 17 of Set 12 | beringovskiy
Processing Record 18 of Set 12 | loreto
Processing Record 19 of Set 12 | hanzhong
Processing Record 20 of Set 12 | ust-kamchatsk
City not found. Skipping...
Processing Record 21 of Set 12 | nueva gerona
Processing Record 22 of Set 12 | oussouye
Processing Record 23 of Set 12 | tahe
Processing Record 24 of Set 12 | rabat
Processing Record 25 of Set 12 | kabin buri
Processing Record 26 of Set 12 | iwaki
Processing Record 27 of Set 12 | buin
Processing Record 28 of Set 12 | greytown
Processing Record 29 of Set 12 | panjab
Processing Record 30 of Set 12 | magway
Processing Record 31 of Set 12 | port lincoln
Processing Record 32 of Set 12 | la ronge
Processing Record 33 of Set 12 | dunedin
Processing Record 34 of Set 12 | may pen
Processing Record 35 of Set 12 | kango
Processing Record 36 of Set 12 | kamaishi
Processing Record 37 of Set 12 | urucara
Processing Record 38 of Set 12 | leo
Processing Record 39 

In [24]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)


Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Bluff,-46.6,168.3333,52.81,78,100,25.88,NZ,2021-10-04 02:36:44
1,Padang,-0.9492,100.3543,82.45,74,100,3.04,ID,2021-10-04 02:36:45
2,Severo-Yeniseyskiy,60.3725,93.0408,31.37,89,100,3.36,RU,2021-10-04 02:36:45
3,Tommot,58.9564,126.2925,37.4,64,23,5.97,RU,2021-10-04 02:36:46
4,Hofn,64.2539,-15.2082,44.96,79,100,21.27,IS,2021-10-04 02:36:46
5,Butaritari,3.0707,172.7902,82.96,68,7,16.69,KI,2021-10-04 02:36:46
6,Puerto Ayora,-0.7393,-90.3518,69.4,86,60,10.51,EC,2021-10-04 02:36:47
7,Yellowknife,62.456,-114.3525,44.42,62,20,6.91,CA,2021-10-04 02:36:47
8,Murray Bridge,-35.1167,139.2667,58.42,54,28,27.22,AU,2021-10-04 02:36:47
9,Wairoa,-39.0333,177.3667,65.55,80,100,5.01,NZ,2021-10-04 02:36:48


In [27]:
column_adjust = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
city_data_df = city_data_df[column_adjust]
city_data_df.head()


Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Bluff,NZ,2021-10-04 02:36:44,-46.6,168.3333,52.81,78,100,25.88
1,Padang,ID,2021-10-04 02:36:45,-0.9492,100.3543,82.45,74,100,3.04
2,Severo-Yeniseyskiy,RU,2021-10-04 02:36:45,60.3725,93.0408,31.37,89,100,3.36
3,Tommot,RU,2021-10-04 02:36:46,58.9564,126.2925,37.4,64,23,5.97
4,Hofn,IS,2021-10-04 02:36:46,64.2539,-15.2082,44.96,79,100,21.27


In [29]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")

In [30]:
# Extract relevant fields from the DataFrame for plotting.
lats = city_data_df["Lat"]
max_temps = city_data_df["Max Temp"]
humidity = city_data_df["Humidity"]
cloudiness = city_data_df["Cloudiness"]
wind_speed = city_data_df["Wind Speed"]

In [None]:
# Import time module
import time

# Build the scatter plot for latitude vs. max temperature.
plt.scatter(lats,
            max_temps,
            edgecolor="black", linewidths=1, marker="o",
            alpha=0.8, label="Cities")

# Incorporate the other graph properties.
plt.title(f"City Latitude vs. Max Temperature "+ time.strftime("%x"))
plt.ylabel("Max Temperature (F)")
plt.xlabel("Latitude")
plt.grid(True)

# Save the figure.
plt.savefig("weather_data/Fig1.png")

# Show plot.
plt.show()