In [17]:
# Import the dependencies.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [18]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=2000)
lngs = np.random.uniform(low=-180.000, high=180.000, size=2000)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x2afb0098c88>

In [19]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [20]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [21]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

743

In [22]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [23]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [24]:
from datetime import datetime

In [25]:
city_url = url + "&q=" + city.replace(" ","+")
city_weather = requests.get(city_url).json()
city_weather

{'coord': {'lon': 114.0089, 'lat': 4.4148},
 'weather': [{'id': 802,
   'main': 'Clouds',
   'description': 'scattered clouds',
   'icon': '03n'}],
 'base': 'stations',
 'main': {'temp': 77,
  'feels_like': 84.36,
  'temp_min': 77,
  'temp_max': 77,
  'pressure': 1007,
  'humidity': 88},
 'visibility': 10000,
 'wind': {'speed': 3.44, 'deg': 120},
 'clouds': {'all': 40},
 'dt': 1616876729,
 'sys': {'type': 1,
  'id': 9368,
  'country': 'MY',
  'sunrise': 1616883884,
  'sunset': 1616927593},
 'timezone': 28800,
 'id': 1738050,
 'name': 'Marabu',
 'cod': 200}

In [None]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
       # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_desc = city_weather["weather"][2]["description"]
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record muisne
City not found. Skipping...
Processing Record hilo
City not found. Skipping...
Processing Record atuona
City not found. Skipping...
Processing Record rikitea
City not found. Skipping...
Processing Record saint-philippe
City not found. Skipping...
Processing Record barrow
City not found. Skipping...
Processing Record roma
City not found. Skipping...
Processing Record norman wells
City not found. Skipping...
Processing Record grand river south east
City not found. Skipping...
Processing Record mar del plata
City not found. Skipping...
Processing Record ushuaia
City not found. Skipping...
Processing Record illoqqortoormiut
City not found. Skipping...
Processing Record belushya guba
City not found. Skipping...
Processing Record satitoa
City not found. Skipping...
Processing Record longyearbyen
City not found. Skipping...
Processing Record albany
City not found. Skipping...
Processing Record bangalore
City not found. Skipping...
Processing Record mahebourg
City not 

In [11]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Torbay,47.6666,-52.7314,28.99,93,90,23.02,CA,2021-03-27 19:29:17
1,Mujiayingzi,42.1167,118.7833,49.44,37,100,17.96,CN,2021-03-27 19:29:49
2,Vaini,-21.2,-175.2,80.6,89,20,8.05,TO,2021-03-27 19:29:18
3,Ushuaia,-54.8,-68.3,59.0,63,75,13.8,AR,2021-03-27 19:26:36
4,Kerema,-7.9631,145.7785,78.13,87,38,3.65,PG,2021-03-27 19:29:49
5,Peleduy,59.6289,112.7406,6.78,97,100,3.4,RU,2021-03-27 19:29:50
6,Ixtapa,20.7,-105.2,73.4,64,1,10.36,MX,2021-03-27 19:29:50
7,Leh,34.1667,77.5833,40.46,46,98,6.53,IN,2021-03-27 19:29:50
8,East London,-33.0153,27.9116,66.2,68,0,13.8,ZA,2021-03-27 19:29:51
9,Busselton,-33.65,115.3333,55.99,94,0,8.23,AU,2021-03-27 19:29:51


In [12]:
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
city_data_df = city_data_df[new_column_order]
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Torbay,CA,2021-03-27 19:29:17,47.6666,-52.7314,28.99,93,90,23.02
1,Mujiayingzi,CN,2021-03-27 19:29:49,42.1167,118.7833,49.44,37,100,17.96
2,Vaini,TO,2021-03-27 19:29:18,-21.2,-175.2,80.6,89,20,8.05
3,Ushuaia,AR,2021-03-27 19:26:36,-54.8,-68.3,59.0,63,75,13.8
4,Kerema,PG,2021-03-27 19:29:49,-7.9631,145.7785,78.13,87,38,3.65
5,Peleduy,RU,2021-03-27 19:29:50,59.6289,112.7406,6.78,97,100,3.4
6,Ixtapa,MX,2021-03-27 19:29:50,20.7,-105.2,73.4,64,1,10.36
7,Leh,IN,2021-03-27 19:29:50,34.1667,77.5833,40.46,46,98,6.53
8,East London,ZA,2021-03-27 19:29:51,-33.0153,27.9116,66.2,68,0,13.8
9,Busselton,AU,2021-03-27 19:29:51,-33.65,115.3333,55.99,94,0,8.23


In [13]:
# Create the output file (CSV).
output_data_file = "Weather_Database/WeatherPy_Database.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")